diff --git a/model-00001-of-000163.safetensors b/model-00001-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b0e38683a08cc2fd52522a798b8a55fbd87e5b5e --- /dev/null +++ b/model-00001-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3207631cedd51aeb02c0b86ff6214ed51abf056ec314aff7d28317c0cef67c71 +size 8609454256 diff --git a/model-00002-of-000163.safetensors b/model-00002-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..32a9b795efc608674871cb3211d417c47290225c --- /dev/null +++ b/model-00002-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dc57f7dd9bb78fbf92c09b8e31b4af552ff67dcd7ef4aeabc612d08894bcdec +size 8602553952 diff --git a/model-00003-of-000163.safetensors b/model-00003-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..199a519da00703e85d5cb381ad71ef365acffb9e --- /dev/null +++ b/model-00003-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c723a9a927877fd28911d6b7b5b7da7755e1c1ed0f6bff4dc7e4904dad4825f2 +size 8602554152 diff --git a/model-00004-of-000163.safetensors b/model-00004-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8bd1380e376977f35ef2083fafb9cdfd10662333 --- /dev/null +++ b/model-00004-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:177580d7050b0fe2ee1294bf84bd380bfc66892bc8f7c2364969a8cc59ea8764 +size 8598786296 diff --git a/model-00005-of-000163.safetensors b/model-00005-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..edf066d8bbdb730af9b66e51b69cb27ced8e3f81 --- /dev/null +++ b/model-00005-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97a1c20c74a7ddd0c2c48d8f905ed6c945731344bc48716c35d6bbf24b3a6128 +size 8602554048 diff --git a/model-00006-of-000163.safetensors b/model-00006-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9493dc19b44b5ff89afb217ebaa2f3f324f85937 --- /dev/null +++ b/model-00006-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d17578d166a6bc5fd6a503dc769197cec3295abd6e6d23530f510b27658fff7 +size 8741916520 diff --git a/model-00007-of-000163.safetensors b/model-00007-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9dbd4720571db8e2157734dea1f33e386bdcd00a --- /dev/null +++ b/model-00007-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cba4682fdf5b5f2ae171b40126c4eacc307dee074b95dbd77a13dc36800741c9 +size 8606225096 diff --git a/model-00008-of-000163.safetensors b/model-00008-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0d4e92f9b19ae4971af744b95cd72dfefcfdd1c --- /dev/null +++ b/model-00008-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc76076be6c29feff6739e81112788a4137e73cd0b22522f1b6452730272744 +size 8602554144 diff --git a/model-00009-of-000163.safetensors b/model-00009-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3f06d03a8111cfd32173f7795ab25c896cf48e6 --- /dev/null +++ b/model-00009-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:730ac3628d7b4ef5767af5675ec4cb91e83eb788c62e9c5b73a5913c22254a3d +size 8598786392 diff --git a/model-00010-of-000163.safetensors b/model-00010-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eeb4c7c9b61f83cb71ec2ccc5c8631826b63d9f9 --- /dev/null +++ b/model-00010-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03f0871c1a36da435e06df57fa79d73e2ff37d10d16ea4682c69245fcfda49ea +size 8602553952 diff --git a/model-00011-of-000163.safetensors b/model-00011-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..977cff8a52e51f0af7e2b7ad7975f51ad9ec1b86 --- /dev/null +++ b/model-00011-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c2f899101d5e6a018a50fff7d995db0d19273b7d4a68d613d7b868509c8df31 +size 8602554152 diff --git a/model-00012-of-000163.safetensors b/model-00012-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cfdf4641055002388b40a22a6dbb25580eaab444 --- /dev/null +++ b/model-00012-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15d803fbb82b55bc87b759b9ed8b08b8f993a76f8e3ee2d2519fba7d31d0bb97 +size 2642451624 diff --git a/model-00013-of-000163.safetensors b/model-00013-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dd63f74b4a2b9ce8e10e94032dc7ac28819252ad --- /dev/null +++ b/model-00013-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e89f227f5d8f92d440f720840b18fc1b142384a01f1ca353db5dfbe091d4eb5c +size 8598757320 diff --git a/model-00014-of-000163.safetensors b/model-00014-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e4655265d0b96108b71dca3697133a6d4bb08451 --- /dev/null +++ b/model-00014-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52d742ae7cd6a27d8ec79984b77e8fb3dbd0ad6d5771d37c20f6ba84a7b212d6 +size 8602554136 diff --git a/model-00015-of-000163.safetensors b/model-00015-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c8c0c2b5c929571ff59dcab9e4590ecc567ba2d --- /dev/null +++ b/model-00015-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939995f6518a1f30c42b3617562d64e72fea83aa928514c9717441ac722c74ec +size 8598786408 diff --git a/model-00017-of-000163.safetensors b/model-00017-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eb15922e06244a27092ca31ec48161a7ac5fbcbf --- /dev/null +++ b/model-00017-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e0fe4fae7af83a971d51f03583d7f219a0de8c3cd803e1bf6bb54c77fbb1f4a +size 8602554152 diff --git a/model-00018-of-000163.safetensors b/model-00018-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ff2129383a3e7ec54d63590d34821a324a13b22 --- /dev/null +++ b/model-00018-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77447d81964156d38316bf608c71ea4a01f500fdcd2442750ca0ed588547a1c4 +size 8598786312 diff --git a/model-00019-of-000163.safetensors b/model-00019-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dfababeb608f64802439eac20557fb5cbfe2cfde --- /dev/null +++ b/model-00019-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba2416b54abfd60da6212449eaaf2a4fe4a79c9f00da49fac3cc9efcbad9ac2c +size 8602554032 diff --git a/model-00020-of-000163.safetensors b/model-00020-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b442b62e933915d2e5347190eb0efa57d1928516 --- /dev/null +++ b/model-00020-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:548ecb72f9df18bfc099096acde328b2f7543b211146e6143352ca79fbbb0af4 +size 8602554160 diff --git a/model-00021-of-000163.safetensors b/model-00021-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9b4f1c40f3f8ce8b621b9f924eb5f8c37b49082c --- /dev/null +++ b/model-00021-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af1a5fa98d1256daf6c958154e7aa062240cd4f23051bb237c06a066c066f2a5 +size 8598786512 diff --git a/model-00022-of-000163.safetensors b/model-00022-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3b6c952adc5f591566ed3cada720d396d88b4055 --- /dev/null +++ b/model-00022-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef490236152246dce9556fdd1d0bc1087379201c8599a060deb0caaeaf680432 +size 8602554416 diff --git a/model-00023-of-000163.safetensors b/model-00023-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52f423aaa34e7a5a01936bd0599f99a9474655a6 --- /dev/null +++ b/model-00023-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f559b80a5154247e7e46612596cb7f62f51342efda16b47b47a25db020219c8 +size 8598786704 diff --git a/model-00024-of-000163.safetensors b/model-00024-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..16fac88d2195b7035527b6cac05ef1a1462cdf72 --- /dev/null +++ b/model-00024-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae441a1e64a950846ca332cdc0b8da025c7807f9e44d3b88a0621980d9c9cdb +size 8602554224 diff --git a/model-00025-of-000163.safetensors b/model-00025-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7a21fca0f26c366516eeb0a7787025a8713f5aba --- /dev/null +++ b/model-00025-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58fa8109385cc3b21e1891889ab17194c819451d1ddff9d415dddf9ce01827aa +size 8602554448 diff --git a/model-00026-of-000163.safetensors b/model-00026-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..227ab1353a75d5a784f95f0b3a55bfb3a2a13367 --- /dev/null +++ b/model-00026-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06496b075d9470852f0f0e9f80020cb82bc2a8dd2b772014e6e7d97bb68a0d4a +size 8598786616 diff --git a/model-00027-of-000163.safetensors b/model-00027-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6a94ec3b15a5932444a69f1c85886f8eb7e6e2bb --- /dev/null +++ b/model-00027-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72984f02ea496d07f6cb8ee6561c1fc19aa5d7cbe388ebaaf73014550ae3278f +size 8602554312 diff --git a/model-00028-of-000163.safetensors b/model-00028-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7759cac9b4a6e9c77c0c6c20843533cffce5ef7c --- /dev/null +++ b/model-00028-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb8b1919c8bdf37fce18784530545d705b71e061d5c3b300d60381989e23ba1 +size 8602554448 diff --git a/model-00029-of-000163.safetensors b/model-00029-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1c17326b117335fba7401de9556f88549cd4b1b8 --- /dev/null +++ b/model-00029-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdef0d17a9c42b9509c984c15425616fc85434f8e1bf6fd81673b6d436c89451 +size 8598786520 diff --git a/model-00030-of-000163.safetensors b/model-00030-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..193df77fc104c249ef34de1c1919cb612cf654bb --- /dev/null +++ b/model-00030-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce2258bd15c06341bf84ed0859e99e3102bccf6f495b9553f20e42df81c301ec +size 8602554408 diff --git a/model-00031-of-000163.safetensors b/model-00031-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..454775f1f85ff6db4bd9e9767ea6d2fd13741ad2 --- /dev/null +++ b/model-00031-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b669917dee5c37e0f3b0323022412a97b0cc57f1d96ce33c0af339e95867d02 +size 8598786720 diff --git a/model-00032-of-000163.safetensors b/model-00032-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..efb78df7114cd734db5d1768c59c4d3beff69e33 --- /dev/null +++ b/model-00032-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87700991adde934c584e0d95c7f08cf65a8aede4eb11fe0a59051561ecb43373 +size 8602554208 diff --git a/model-00034-of-000163.safetensors b/model-00034-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a42999a5e5bad2bb474681d687c6d2ebdcd354ed --- /dev/null +++ b/model-00034-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d6d9b50c22921ee6d4016ef740e563e6793b1e7e69271af034560163e5773a8 +size 3493899088 diff --git a/model-00035-of-000163.safetensors b/model-00035-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..313be3bf07b61e42b5921151c44d13e7fe068e92 --- /dev/null +++ b/model-00035-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf60d27e1404a8d9388f248f1add5389a11f01a0db7a4d75ce6c1b41737b0d0 +size 8598757608 diff --git a/model-00036-of-000163.safetensors b/model-00036-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..beee33594f357c236ea8fc88ef49188f07ad22c0 --- /dev/null +++ b/model-00036-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be27480b4cbad66be5b86b240b14a05adff9680b8a80df4f045ab32929541a6b +size 8602554424 diff --git a/model-00037-of-000163.safetensors b/model-00037-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..96d6c3488c5d6126a29bdcbd2f8c22f8f3ea4819 --- /dev/null +++ b/model-00037-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e412d97eb628974859b51833fc104a63ff988e9d7e1d4b7fca705287f71152e +size 8598786704 diff --git a/model-00038-of-000163.safetensors b/model-00038-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e85d9c2a90480ee36dd033f1a47e8687f45acb54 --- /dev/null +++ b/model-00038-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6ecd6fcb8a6ba1553055afa8b4c13bba25faf30d2f929ff9a156d4f0cba4d45 +size 8602554224 diff --git a/model-00039-of-000163.safetensors b/model-00039-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0c5c5af23933b578bd012b3bb1ae455d712f0938 --- /dev/null +++ b/model-00039-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c023e80b0a6bcd2d3585772a9d313d6d7517b811b6ec62e66018573e500cb4cd +size 8602554448 diff --git a/model-00040-of-000163.safetensors b/model-00040-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..83fbdd59b63e8c27e6c58d8150383beecefa117c --- /dev/null +++ b/model-00040-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:408c62feb72975f0d3b0c3453eae71e8e2328f698bd156fbe2f009748c98bd37 +size 8598786608 diff --git a/model-00041-of-000163.safetensors b/model-00041-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d93a400599551f7ea2a5868a88d01a5cc88ec596 --- /dev/null +++ b/model-00041-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a40c9c131f7204c27757c016057ca52c3f4f73a928a47fbc893a09b72cb2211 +size 8602554320 diff --git a/model-00043-of-000163.safetensors b/model-00043-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..134804cb82cdb61dac791281a17a880171c29811 --- /dev/null +++ b/model-00043-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b51315a6e5a494183db094d98abc30795f3ecbab4173e35880b47c92596d5845 +size 8598786504 diff --git a/model-00044-of-000163.safetensors b/model-00044-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..022105e3467026bd84444be63382cf8ec692b8de --- /dev/null +++ b/model-00044-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f69435553f07ac34ffc91209db483e72b609b5ccb3ce5caf8063d5f3d9f53b39 +size 8602554416 diff --git a/model-00045-of-000163.safetensors b/model-00045-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb601e069fd4f05ed4fab486d04856a8736e712a --- /dev/null +++ b/model-00045-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:422155dafef6d2a0cb23a97ce346c288c5dfee965b791ab08a1ab11c7a68fa0f +size 8598786704 diff --git a/model-00046-of-000163.safetensors b/model-00046-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..887681ab05cd65520b5b25f658362d44cb36a07f --- /dev/null +++ b/model-00046-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf12d9f584ab0a46b3ea9507b83ec796664fce4de7ef459ccb75bf7481561ea8 +size 8602554224 diff --git a/model-00047-of-000163.safetensors b/model-00047-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..516ffcfef9cca66781b2bba10e1b0d71b79aab76 --- /dev/null +++ b/model-00047-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:234a8286a23bee608d9d65eafa5d2391fce13b22b8c21e23f3682e89dd1598c4 +size 8602554448 diff --git a/model-00048-of-000163.safetensors b/model-00048-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cec6571c0277ac1203b7f87b268ce46bd6b1dcb0 --- /dev/null +++ b/model-00048-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66239cc48fb9584dc29b2ecd85182f8cd91be19d91239f5dbf7fdd123cb2ee22 +size 8598786616 diff --git a/model-00049-of-000163.safetensors b/model-00049-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd0ca909e8fe785697a59030e1c139a331e319c5 --- /dev/null +++ b/model-00049-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df92249d2162e2237eb7780d797fb60cd069f868166507de2194d16fc0697c6d +size 8602554312 diff --git a/model-00050-of-000163.safetensors b/model-00050-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..30df233608b8ce488367b56c29de9c2174e2805b --- /dev/null +++ b/model-00050-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d5b5c0f5cb21eaebc30012df0365d1f88c73be1b237138fb7d57797c25f0b1 +size 8602554448 diff --git a/model-00051-of-000163.safetensors b/model-00051-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bf109d9b83a0c5bb5025ab05e2849d8cae9c70ac --- /dev/null +++ b/model-00051-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbeddb7da0d3130b3dc6be1f2a02672756b02b9efc7a9e5456eb5a9a6ad30f55 +size 8598786520 diff --git a/model-00052-of-000163.safetensors b/model-00052-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52523152349806138ea2b10dc6066086ea16377b --- /dev/null +++ b/model-00052-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a3d6a6664894c10f39fa75858d5dd96ac645e355a54cb24a7caecaaa3e0819f +size 8602554408 diff --git a/model-00053-of-000163.safetensors b/model-00053-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7d6b7ba0553637496fe3a8926cb421f7c23a2fa9 --- /dev/null +++ b/model-00053-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2a27cc21f7bf992127d8997eec678e6b2bbcc9e4c5aa362115545a69a938ce1 +size 8598786720 diff --git a/model-00055-of-000163.safetensors b/model-00055-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b34b99dcee3909ceb931cdcca569ce06edd71097 --- /dev/null +++ b/model-00055-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:187d2d2d3d8ad7ecf1b52c22189d90d64f06abb195db7d0c3b3cc98d5460b1e2 +size 8602554448 diff --git a/model-00056-of-000163.safetensors b/model-00056-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2adb205af5fbc136c16d860ae0d997deb9f20d29 --- /dev/null +++ b/model-00056-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974dedf0fbeeca625438bbcc6c6a6bd32cbc2c72d1e2990d8c2491beb5a298e5 +size 3493899088 diff --git a/model-00057-of-000163.safetensors b/model-00057-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..41c4a8a2ffc95f34c967038b43eb3005717e5a18 --- /dev/null +++ b/model-00057-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bd49957792f9ffc2be608510ad3ac0e742feb6c0c89c562c38b9de042c4411b +size 8598757608 diff --git a/model-00058-of-000163.safetensors b/model-00058-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..140467c87f46d09a2044bd1739eaa2894ce9f7ac --- /dev/null +++ b/model-00058-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca9d47d82daa2ddb66bf7c6e1f9fcae241958a18f4b0d281220d0f651b06d007 +size 8602554424 diff --git a/model-00059-of-000163.safetensors b/model-00059-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f57b6ff08e96e4cba39b2e49f8ba517672656b77 --- /dev/null +++ b/model-00059-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c61fa8774a9ce21d850151b59680823a231865b925d5835b73bedcaca02747f +size 8598786704 diff --git a/model-00060-of-000163.safetensors b/model-00060-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..77efe094d0624e2be51489282fd7f33d3bedffa3 --- /dev/null +++ b/model-00060-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d88adda03760b646641aea1a8d4c5c03b59a6f9ee0a0348bc79d7c38a87e8af0 +size 8602554224 diff --git a/model-00061-of-000163.safetensors b/model-00061-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d59be675e34f34cd93f2ac659c27800df6af7c8e --- /dev/null +++ b/model-00061-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbf3aa95b7375f5fb2858c34f29f66a8ad8f011bc5f0c371e8fef1be1af8bf8 +size 8602554448 diff --git a/model-00062-of-000163.safetensors b/model-00062-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..995cddb06fb7d7b2454c0e640fd942b5700603a9 --- /dev/null +++ b/model-00062-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df55a04fbdbb4d61bc1872935fcbebe5525c2d383961f4bb2b731c36b542dae8 +size 8598786608 diff --git a/model-00063-of-000163.safetensors b/model-00063-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6c9dc7249a5e97d3fad32635583198ab3cdcee8c --- /dev/null +++ b/model-00063-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2919b14ad774ba5c6d1286cb5ff7ac599bf6149512fe5734c3524469c693be0 +size 8602554320 diff --git a/model-00064-of-000163.safetensors b/model-00064-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b2fc091c0e0e32f4dd2c5ede0598411444db21e9 --- /dev/null +++ b/model-00064-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:733a7f88d9af785cf656459f1ec22d3605e3980472d5160682976c8e813d7ee0 +size 8602554448 diff --git a/model-00065-of-000163.safetensors b/model-00065-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1470cf38c4abd52a04ab56e4c77f5e6fcd978071 --- /dev/null +++ b/model-00065-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22273396ba73c330e2af49a06e4ee1b54f5ed2e3b09eeadca6fe669c8160f925 +size 8598786504 diff --git a/model-00066-of-000163.safetensors b/model-00066-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a9a735ba7288c898846b6b6f4302b3949ac4dd3 --- /dev/null +++ b/model-00066-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00bea9a0947a5b6e61995f5e3b90cc1e0764563e3abfb206b6f6b662c87db1c6 +size 8602554416 diff --git a/model-00067-of-000163.safetensors b/model-00067-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ffab17ec124636487c7425019d07363f89f8740 --- /dev/null +++ b/model-00067-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b6e61408123d9a5771e0d035e3d281d9dd063ea2f8b848443d025cd1da896b +size 8598786704 diff --git a/model-00068-of-000163.safetensors b/model-00068-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b6a1e6c235ecc99950d0bbe1600c0bc703e31347 --- /dev/null +++ b/model-00068-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70c85c91669b4e37cf1a9a655db3eee38928b22288b303ad104f49b5fb4b67fc +size 8602554224 diff --git a/model-00069-of-000163.safetensors b/model-00069-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f236523ca6c48668ebc88041f6cb2c1a29efc120 --- /dev/null +++ b/model-00069-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbcea7d9ea100c00409cf35a2c31f47e4e1087978f268192bb1955224686666a +size 8602554448 diff --git a/model-00070-of-000163.safetensors b/model-00070-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bef459d7359e39c937fc08c3b416d52094b31c38 --- /dev/null +++ b/model-00070-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa0705b0044fc73fb171cb5a53c762f1fabde40c5a5ab91941890ed1f48392ce +size 8598786616 diff --git a/model-00071-of-000163.safetensors b/model-00071-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ee66ed198044b1aa043d6391f06af8626302534 --- /dev/null +++ b/model-00071-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10aaf82262a27857d375acb336c096a48d19609a4b35e012f8558b792c4dc04c +size 8602554312 diff --git a/model-00072-of-000163.safetensors b/model-00072-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a840b185bf562c46cc752e0c05a4e5d0d7f2a8a6 --- /dev/null +++ b/model-00072-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31674efae31045a896cd210274bb941605412318e3bd542f6d4c71430c39bc00 +size 8602554448 diff --git a/model-00073-of-000163.safetensors b/model-00073-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..32d79031f407dd75969cec2decd2daca7332138e --- /dev/null +++ b/model-00073-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83549aa6bd9bbf90e1660d025f2c9306bfccd14631b9335fba54a32a6c59c15d +size 8598786520 diff --git a/model-00074-of-000163.safetensors b/model-00074-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..66177d17689cadc24966fb9cdaa7a7967676e5d4 --- /dev/null +++ b/model-00074-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6724dbf6490e2b2c6d9361c0a67521d0cb4a0f116ba5fd3b591bd369a8692f9e +size 8602554408 diff --git a/model-00075-of-000163.safetensors b/model-00075-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ed1607c1cb3cb79ae9a991745b468d5e7e841c84 --- /dev/null +++ b/model-00075-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e88f03a5112552d0b3cbaadffde36cf27147239ffba4de84554a3734b2d9c8 +size 8598786720 diff --git a/model-00077-of-000163.safetensors b/model-00077-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0d1cbfc2ceb44fb8542953f0e6726f31ec97572b --- /dev/null +++ b/model-00077-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c277d3e9b52b329fcc5f0be5a65de2bc564d2ee4035d30d755c061d754055542 +size 8602554448 diff --git a/model-00078-of-000163.safetensors b/model-00078-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a393ec0514cb523eb79627d7492ca3afdec83ef8 --- /dev/null +++ b/model-00078-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d7c716982cf04afad9f91c2ea1bcf3c94356f137ea7c353d83ceb50628952b4 +size 3493899088 diff --git a/model-00079-of-000163.safetensors b/model-00079-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ffd6a0cf5ac49058e8733b8b9ac7db2f089342bf --- /dev/null +++ b/model-00079-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffa811d315e6ca92bcd93978b19fa2db8fea30aab23df9ad6c919dd4288c0056 +size 8598757608 diff --git a/model-00080-of-000163.safetensors b/model-00080-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d44cd05f8ba093c4a8385acd7f551cfc7e3f8aa8 --- /dev/null +++ b/model-00080-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb53873ffaee362d163367d4a96c8298e037ccbf6c2e46a29e75a5282255a822 +size 8602554424 diff --git a/model-00081-of-000163.safetensors b/model-00081-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ecae049a67c3e7c8f0d4760f865bb022483df534 --- /dev/null +++ b/model-00081-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e2bf23cd596da1e01e2758d4a3535c9abd09c14b51a43586cc45a61225fd16 +size 8598786704 diff --git a/model-00083-of-000163.safetensors b/model-00083-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e406f23c783726d87acefe59cc0e94871d8b9e1a --- /dev/null +++ b/model-00083-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a86a605ce9d7228a913e0269fa35ac8bb3b983367a5fd9dcea99a923879a5b5 +size 8602554448 diff --git a/model-00084-of-000163.safetensors b/model-00084-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d1e10e8f68fa9e74e84ba1b00b6096940f4c26e1 --- /dev/null +++ b/model-00084-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4637c7e3bbb2cc223b2b31f6064dafd92505d5643621baf8883f2691f5a8cb1a +size 8598786608 diff --git a/model-00085-of-000163.safetensors b/model-00085-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..252777dd059ed452c0b0d515dd23003090ced833 --- /dev/null +++ b/model-00085-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b28170e23c16ab6af490a57310d308942f38394a41743132d9537400565bb5d +size 8602554320 diff --git a/model-00086-of-000163.safetensors b/model-00086-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9033c853921e7c98d5f4e9a04b238452d6318f56 --- /dev/null +++ b/model-00086-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37684ae5e8c7643ba2e4b8c73ea99a6682cf2558afa7544311335e184252ea3f +size 8602554448 diff --git a/model-00087-of-000163.safetensors b/model-00087-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..50b5d30e7db386100f1b3663ccf5c56526865379 --- /dev/null +++ b/model-00087-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ab902e5ef27a3c3822bdd81facd7a5a204d7fb297f8fd798f8ba9a5133bfa06 +size 8598786504 diff --git a/model-00088-of-000163.safetensors b/model-00088-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c0f2ca6b8c02208f100a25cf920eaf66dc084125 --- /dev/null +++ b/model-00088-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce62f35a483a71399cf5ec020171556e1fa59d47cf264448cc1d8c3b3d50ecec +size 8602554416 diff --git a/model-00089-of-000163.safetensors b/model-00089-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a637972f772005af307f7c71f196d4cd4207dc1b --- /dev/null +++ b/model-00089-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca60c7753be9ab1d1c373bd6e34c5c2adf672308bc2a3197b8068b2998fd6304 +size 8598786704 diff --git a/model-00090-of-000163.safetensors b/model-00090-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9b8ba438a383f1f565d14160d5a9ddb9ff495c0c --- /dev/null +++ b/model-00090-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae0a71081d0e9ce67d361ea709fdf1ffe15b67372644e8d17a384e9a2e2b9de5 +size 8602554224 diff --git a/model-00091-of-000163.safetensors b/model-00091-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f77f171fe924642ec0e17a49e9be701efd02d5c --- /dev/null +++ b/model-00091-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baf9e547cfee50da6fdab1eb8a7e75ce84629ae530aa8a28fd3710d1979b44be +size 8602554448 diff --git a/model-00092-of-000163.safetensors b/model-00092-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e78f6da3b00cb2f3ce2e84b1a2a041d95abad803 --- /dev/null +++ b/model-00092-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0ee2bfefc79e57b91af8ee0ebdb48a9c37cd2be5b45fec02b66108269bf8fd8 +size 8598786616 diff --git a/model-00093-of-000163.safetensors b/model-00093-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f9c62f753face595640b5a32d91e115c8eb36ab8 --- /dev/null +++ b/model-00093-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368e4745c45b8017fe832774f593cfe6e27f98ab828b49e5e915b5fbe912deaf +size 8602554312 diff --git a/model-00094-of-000163.safetensors b/model-00094-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..101d9ad85d89a230e602e0b56306c5284c122cb7 --- /dev/null +++ b/model-00094-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76c54b159c39eab332aef6df08e1e8bdad3371848eb6d9228f173655c1eb189b +size 8602554448 diff --git a/model-00095-of-000163.safetensors b/model-00095-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3b115e1d39bb5a0554d556c464020ef9c3a6d5a1 --- /dev/null +++ b/model-00095-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98369716825456e68b68f0070c2f5ff5ca4c8e6508c7f122f0b08d51d6a1509e +size 8598786520 diff --git a/model-00097-of-000163.safetensors b/model-00097-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8f8ca3e7a7a770396ee581e195eddd8a1fd16cb0 --- /dev/null +++ b/model-00097-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831952d25b160cbb8bd1426267a2d0a8103d87973f4ed8c3e55a56f0bce8a78 +size 8598786720 diff --git a/model-00098-of-000163.safetensors b/model-00098-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f73d5d4d49646534608fbd1fca1f4fc850c1418a --- /dev/null +++ b/model-00098-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d46ed04ba51bac8bd342b621ef27b2ef5fe7c9bba6da32744a9ca78179763bb +size 8602554208 diff --git a/model-00099-of-000163.safetensors b/model-00099-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..087ee5d2af56991ac7abba5438c80c32accd14d6 --- /dev/null +++ b/model-00099-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6709d9658832bace0b7f048281131e3ce00afb285ac0139106af82112283c0c5 +size 8602554448 diff --git a/model-00100-of-000163.safetensors b/model-00100-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a46284a3d08459b048d0eab46534a015b2a586d2 --- /dev/null +++ b/model-00100-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d18726836d624e22899f8a0515902e26b2e8f6b6cc1c760efce7a86be9f05eb1 +size 3493899088 diff --git a/model-00101-of-000163.safetensors b/model-00101-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..29114cbcfd97db4ab4c812cdc706e5699e08b9ea --- /dev/null +++ b/model-00101-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe1d3d9a2a231ccbf79243b7d34e31ebcf1bf51367cd9c4f8d5b8d3daf746ae +size 8598757608 diff --git a/model-00102-of-000163.safetensors b/model-00102-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2302f9a9755e6ca8727b67bff9a302a313bd278a --- /dev/null +++ b/model-00102-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:508b1ad64ff8b2d8b3d9213e3cada0040ed3a526357f2fb6f0acdc58285b8fa4 +size 8602554424 diff --git a/model-00103-of-000163.safetensors b/model-00103-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d465d18cb77f24a38e94d3dc3b864f9ee630ac69 --- /dev/null +++ b/model-00103-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:745692de7d84c56d847414f232f392b3b55a79a78667828c810faa0f79c7c78c +size 8598786704 diff --git a/model-00104-of-000163.safetensors b/model-00104-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2f4c7599ad83a22b7a0e63541be9f13054dea9e2 --- /dev/null +++ b/model-00104-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5742b647d68bcb13f36c8d98240514b71d0b3b325de59f1ad5a4910f2d3c00b9 +size 8602554224 diff --git a/model-00105-of-000163.safetensors b/model-00105-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e0ac86b0159341eae0f8a26fc6e5fcbcd9275d21 --- /dev/null +++ b/model-00105-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aefd75deb2fd7f297b87a2cc5de027afe6dd299b779aa7fe714b5510fa826f74 +size 8602554448 diff --git a/model-00106-of-000163.safetensors b/model-00106-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8ddfe7e8b6d1c9192bd6e80b6f32121a82661cd3 --- /dev/null +++ b/model-00106-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4b74d7f61c2bc9e45cedc9d06e02c02df3e6e455e8ff74b877906817827dea0 +size 8598786608 diff --git a/model-00107-of-000163.safetensors b/model-00107-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..62ecd6b7dad889e42dbe618fc51176408509237d --- /dev/null +++ b/model-00107-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd90d7da3b9852c34ab5245bb7f093cbbc86e2b5d5b47cf666b6cd31ee9e6ea4 +size 8602554320 diff --git a/model-00108-of-000163.safetensors b/model-00108-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..766a5f7714639a870fb7a21eee928a8e0b7b1c43 --- /dev/null +++ b/model-00108-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5bece39f330eb8b410f7a76f66516ef905f9facf3d88a13b2d6d9ad850be16e +size 8602554448 diff --git a/model-00109-of-000163.safetensors b/model-00109-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..529bd1d9b8eb8c7035f5d9d5447b7103483b8003 --- /dev/null +++ b/model-00109-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d8a85e7647a5b0252e999b7fa7ba9726478bce0225d5adbe98df5ff4a5d97a +size 8598786504 diff --git a/model-00110-of-000163.safetensors b/model-00110-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f63038563679d6d93e39075a2883e372c1c19f8c --- /dev/null +++ b/model-00110-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2884328bce3ffb6f48f11e583761e6474e1fd60c22908327739bc0eff4c5aab0 +size 8602554416 diff --git a/model-00111-of-000163.safetensors b/model-00111-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03d48cbec16b85077ae24d63137d420e0207dcaa --- /dev/null +++ b/model-00111-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12dbe09a637c7777b0ada857d9cc0909cb8c49c782c5557987a932c4215f2830 +size 8598786704 diff --git a/model-00112-of-000163.safetensors b/model-00112-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a5dd13a1720f00382e2012bf340cce83b36b264f --- /dev/null +++ b/model-00112-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7566eff77a9438992e3f1a4b57d7122a79dd41fea87870136e796deeb36569c9 +size 8602554224 diff --git a/model-00114-of-000163.safetensors b/model-00114-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..818c6d9a55e0945e68dc102498a31c595bd6c8cb --- /dev/null +++ b/model-00114-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c102ddfe9204bfe8a3f2422da47dfb00860b51c51d6dbd5f41d23280bb1c286e +size 8598786616 diff --git a/model-00115-of-000163.safetensors b/model-00115-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94e58ee9dc7bbe05275aa49004d6e9e446f18aa4 --- /dev/null +++ b/model-00115-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e68478f93421a1701306a9b38adf60733bdcdf4116a47bdfe49af9716b9dc530 +size 8602554312 diff --git a/model-00116-of-000163.safetensors b/model-00116-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a7223d99712fb5e7e3302671acb336fea0b68702 --- /dev/null +++ b/model-00116-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03d3701208ed54fe54db941a92139a8c672d5f587e7a3896f85adea5ce022309 +size 8602554448 diff --git a/model-00117-of-000163.safetensors b/model-00117-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d4e61876ff87ba849eb4ff8b579b3d9f45201fd2 --- /dev/null +++ b/model-00117-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de3f39174f7f42db2a154b91c7d0fd113bf788e2d259239320e5f50d2c207a5c +size 8598786520 diff --git a/model-00118-of-000163.safetensors b/model-00118-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cde14be8ef9eb0315e97dc6ec6c76fcf8b11b15b --- /dev/null +++ b/model-00118-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:040911a6df205b14de824659c5b33c617578b08482c757c24e159053e159da47 +size 8602554408 diff --git a/model-00119-of-000163.safetensors b/model-00119-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8ca3ab3c423a55a32e986a3c4602d1bfe3bbf7b --- /dev/null +++ b/model-00119-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f05ac08a43fefb9d7028388897e601954c5f5b7f64ebef80d8aa74a7cfee746 +size 8598786720 diff --git a/model-00120-of-000163.safetensors b/model-00120-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..058f8eca113654a5af256b0561358900ca8d150c --- /dev/null +++ b/model-00120-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c3d91cd4793e50bfc39a2d41434e68c176f5adf387a7291f40cb43d3a6cdf45 +size 8602554208 diff --git a/model-00121-of-000163.safetensors b/model-00121-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3667778d6e5d436f6302d40d16717d0e79042e73 --- /dev/null +++ b/model-00121-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ffb06abb506dfe7aabbbb5a08bf6fbb318e0d64935ec9a962fd1aeddaa2ce9b +size 8602554448 diff --git a/model-00122-of-000163.safetensors b/model-00122-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd699640bf72ef315935e8376fd2849fc1eb1981 --- /dev/null +++ b/model-00122-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b62f5396680f187966be39d78e3000303cb9dd8e4d0c91622bbe7a56042cb59 +size 3493899088 diff --git a/model-00124-of-000163.safetensors b/model-00124-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8c1c741bb137bc2b075f5dd5b7f850b7e736f1ff --- /dev/null +++ b/model-00124-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d78401c9c3726d9490e21ee3b09394748fbd5c8fea4c696be832cc663bcfc89d +size 8602554424 diff --git a/model-00125-of-000163.safetensors b/model-00125-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..363a79ceac4f7adb3a7ba081b7163d72a3f15332 --- /dev/null +++ b/model-00125-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1366c5502fad14563b4b7e052c805cb8d8caeccc887a3dd7f8665e8e3631b3a +size 8598786704 diff --git a/model-00127-of-000163.safetensors b/model-00127-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5fd409ba72803f48cfdade69ff22e64a5cd98f77 --- /dev/null +++ b/model-00127-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:902f6f5de79e9a3ae646d82d70948f4764f8061f468f2febf814fcc72f5d0bb5 +size 8602554448 diff --git a/model-00128-of-000163.safetensors b/model-00128-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..299051115f948e9becc46bc5db2159a43134112b --- /dev/null +++ b/model-00128-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02aafba6b65f9727558a0cefa35ffe40dbe230995d0777ececc4bc226e65a391 +size 8598786608 diff --git a/model-00129-of-000163.safetensors b/model-00129-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d5f01faa156b33af5ffbc68e13e5200126483e3 --- /dev/null +++ b/model-00129-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e520349e5b528a5f5d09911cb93b364990d2b92c7f196b653802871a78325c +size 8602554320 diff --git a/model-00130-of-000163.safetensors b/model-00130-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..867b4334744f5cd63108c6de01191d6f5f05588e --- /dev/null +++ b/model-00130-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a50b3526cd817a28d15866cafd36f2e711293a77218638e864f2fbbabdaa09 +size 8602554448 diff --git a/model-00131-of-000163.safetensors b/model-00131-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ccadbc4204d6a8a62f1432bddfe8e17f467825e8 --- /dev/null +++ b/model-00131-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06542ec0ae43961d4e4f5e358d5bee46e8ead652a6479fb435b5b7f8c65ee4f9 +size 8598786504 diff --git a/model-00132-of-000163.safetensors b/model-00132-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..76c3fc6a011fa156f1d3fc6f374b2cb1ac69240c --- /dev/null +++ b/model-00132-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49f43e43d5b064082907c7d1f66ba4e42cf31c06ea171aaeef5c1e77d710b8b +size 8602554416 diff --git a/model-00133-of-000163.safetensors b/model-00133-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a378876249aab0de1e8c8f48d7e6c71e4847dec --- /dev/null +++ b/model-00133-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5016016eb3942f1db277c78e4286d71129b611438e16971a6e52df33c0e8f1 +size 8598786704 diff --git a/model-00134-of-000163.safetensors b/model-00134-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..10ec2acc49a06ba521c0e9827f9ae6f2301c25a4 --- /dev/null +++ b/model-00134-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e914a782c6156eebc49c0851cb87e65ab24ea85c17ae1caac3ae536b3ac12f1c +size 8602554224 diff --git a/model-00135-of-000163.safetensors b/model-00135-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..39fc453a92f2011725def2cfa73a76016a0906d3 --- /dev/null +++ b/model-00135-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f22fe563247141ec5a468add5f153e24fbd3a5d63f899b80f05451dfdd5a299 +size 8602554448 diff --git a/model-00136-of-000163.safetensors b/model-00136-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1cc568f8dbfdaea4692cd8ed9c426f6b2f18b235 --- /dev/null +++ b/model-00136-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a993607af2cc4ff1afd5a301055ef16c639a53c638554d25c1e4749351131132 +size 8598786616 diff --git a/model-00137-of-000163.safetensors b/model-00137-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..964172853b9d9778837af7d0c2b91b53ddbc931d --- /dev/null +++ b/model-00137-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e79a7f3dbb38c2e84dd4eae2900666d9ebeb3c9711e679b8e2aab57bc3661f +size 8602554312 diff --git a/model-00138-of-000163.safetensors b/model-00138-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bbefd7cba6e8c06cf24985a5c44d26c0a1cca297 --- /dev/null +++ b/model-00138-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dce87b4b389f0629de4dbfa49256673255f19aecb1a239f6a66096e0b54327cb +size 8602554448 diff --git a/model-00139-of-000163.safetensors b/model-00139-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..965ddc1d4fa166145fecff3b783263b4d1c0c25f --- /dev/null +++ b/model-00139-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0ef1976a0d3028f55a144ced186d13a5ff3df7e244b7230c2314cd46f4fb97 +size 8598786520 diff --git a/model-00140-of-000163.safetensors b/model-00140-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d67624529aa535e2120f16fb34327d31cad4fc0 --- /dev/null +++ b/model-00140-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dce9f3404bbca55fc40183fb37edacf0680c2773c432d5b3eadeaba1ba2ae19 +size 8602554408 diff --git a/model-00141-of-000163.safetensors b/model-00141-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f94027ecf0167b17250326d1519bb4d5e487f325 --- /dev/null +++ b/model-00141-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43ee438f657ad0372b33bd30ec2d2a84aab2d1d8a08c47ed96678de80e0f7753 +size 6283123256 diff --git a/model-00142-of-000163.safetensors b/model-00142-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f64fffcea09be5f5606822748756da62d099e194 --- /dev/null +++ b/model-00142-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93234712b9b76183d252fa9b3a3f7dd74006f65c93bca3ad993ea256165f7d0 +size 8598757608 diff --git a/model-00143-of-000163.safetensors b/model-00143-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4116330bcf571d0e1b736a3e6cf250132a5bac30 --- /dev/null +++ b/model-00143-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba83141fe488918be0ad65863e7ea441494428d7e70919169b93e510cea76af9 +size 8602554424 diff --git a/model-00144-of-000163.safetensors b/model-00144-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a6dd84530c0bb358340ccc89acd7f765c0cb1f2 --- /dev/null +++ b/model-00144-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2918bfa621e0769901cd9e7686025a7f7c44e974f7ed5d76c357905c379b04b2 +size 8598786704 diff --git a/model-00145-of-000163.safetensors b/model-00145-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..74865fe58b9ea96030839a751ea5adc2f9d0e36f --- /dev/null +++ b/model-00145-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60072e4570b2f6760f14317b42557f00e767c669a3d7b799dfec2a7f81a0d4c8 +size 8602554224 diff --git a/model-00146-of-000163.safetensors b/model-00146-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..31c7ec78c9569d3ef0b4c04c2718bf0950b1b3ce --- /dev/null +++ b/model-00146-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb5450f1cba8d179acef6f1baea46c53ba9b8a09434a642cdd90edbb0e3996b1 +size 8602554448 diff --git a/model-00147-of-000163.safetensors b/model-00147-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..55c59e9cf40d4b8ff22feff745bc01e7116475b0 --- /dev/null +++ b/model-00147-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd25bdb326903c3a001eb395e1a2d2a6297d2b1c54817ad179b2e6ae7327b9a2 +size 8598786608 diff --git a/model-00148-of-000163.safetensors b/model-00148-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b97804921b7094b6162b16caaa112d5ced07bc34 --- /dev/null +++ b/model-00148-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbe3b7e70eba74a2b5ed817d352983ac5565ee13cf277991664258f516021414 +size 8602554320 diff --git a/model-00149-of-000163.safetensors b/model-00149-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eb95d14e96e4fc53871530ddd30e9ffd178e98f9 --- /dev/null +++ b/model-00149-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:703ab276ef221151ce8e385bcc4d16d0cc8f6e79f6be5acf39d6fd7fd01403fd +size 8602554448 diff --git a/model-00150-of-000163.safetensors b/model-00150-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..935d42a5fba8a21e10d2d4ae8035103a2d565acb --- /dev/null +++ b/model-00150-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c5d8ba2566d6dbad42e7be54b6b9463581437686d95ba8d07ba30a69234084 +size 8598786504 diff --git a/model-00152-of-000163.safetensors b/model-00152-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4dcdff9ed0b45dd53c90b0ae65e1cdf6db8c5353 --- /dev/null +++ b/model-00152-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53594ed29b9d883689f08a51c5e1c4c705e20c0a8a13868fdd3a3ff575fa2927 +size 8598786704 diff --git a/model-00153-of-000163.safetensors b/model-00153-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b690f6b990abdfff4059eb659fe97f52ebebf1d7 --- /dev/null +++ b/model-00153-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4f9973c00c9c68c924744eacd2bca77f6f9e0810becbb5c4d5fe09d58a489ee +size 8602554224 diff --git a/model-00154-of-000163.safetensors b/model-00154-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..47db09226165a8f46bbe14ee7ad955aef48fe920 --- /dev/null +++ b/model-00154-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21a07dc92d77597a37c69f2060fc9572fe742968a50e68ac42326ad7b249f9c6 +size 8602554448 diff --git a/model-00156-of-000163.safetensors b/model-00156-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ff874128b8ec63c3f1a2d1f051088b1d8a512dd4 --- /dev/null +++ b/model-00156-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f5e68b01765752cbe7f654250997923005bd22e5babf63ec1bd9a4f805d2ed +size 8602554312 diff --git a/model-00157-of-000163.safetensors b/model-00157-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8121579c5a4565780a2425c26ff2a5e4ed9c6a79 --- /dev/null +++ b/model-00157-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3286d56736c035e16799b3f6d56d8de0264a8fcd3109dfbe115c4b9abb6ee624 +size 8602554448 diff --git a/model-00158-of-000163.safetensors b/model-00158-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0626dcdb93563e969c3ffdff5ab5aea06f0d6b41 --- /dev/null +++ b/model-00158-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3614b3a48478b497e59c1f54d6c1f35a5a9a1ce8c90255c181d13206d147df59 +size 8598786520 diff --git a/model-00159-of-000163.safetensors b/model-00159-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23a073320fdb31e3cc2114c60c820c5f18220d74 --- /dev/null +++ b/model-00159-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a82ae24c95b4779a1d0281d78626c7de1b8a61a933e7f80d323fbbfbf5afb1f +size 8602554408 diff --git a/model-00161-of-000163.safetensors b/model-00161-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8aac8aa3cc78209bc5a7a85fcffde6b55b29494e --- /dev/null +++ b/model-00161-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:791512e93ec4945ebfc68a00466a6c9f7f5bb336e01c5552c54734db2f85b9ee +size 8602554128 diff --git a/model-00162-of-000163.safetensors b/model-00162-of-000163.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5ad083b30a22eb4dcaefaef146bc07448ca0146e --- /dev/null +++ b/model-00162-of-000163.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2fba41ae0a397444fd749be6193fe88eec63537a0acb7da4a6cb423d17e86d7 +size 8602554440 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..5b60276c1efb766f6a1aee2e357e27407f6ed12b --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,46188 @@ +{ + "metadata": {}, + "weight_map": { + "model.embed_tokens.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.gate.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.gate.e_score_correction_bias": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.129.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.227.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.input_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_a_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_a_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_b_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_a_proj_with_mqa.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_a_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_b_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.gate.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.gate.e_score_correction_bias": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.161.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.input_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_a_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_a_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_b_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_a_proj_with_mqa.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_a_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_b_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.mlp.gate.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.gate.e_score_correction_bias": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.194.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.194.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.194.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.input_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_a_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_a_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_b_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_a_proj_with_mqa.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_a_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_b_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.gate.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.gate.e_score_correction_bias": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.226.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.input_layernorm.weight": "model-00012-of-000163.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00012-of-000163.safetensors", + "model.layers.7.self_attn.q_a_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_a_layernorm.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_b_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_a_proj_with_mqa.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_a_layernorm.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_b_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.gate.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.gate.e_score_correction_bias": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.190.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.input_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_a_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_a_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_b_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_a_proj_with_mqa.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_a_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_b_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.gate.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.gate.e_score_correction_bias": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.input_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_a_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_a_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_b_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_a_proj_with_mqa.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_a_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_b_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.gate.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.gate.e_score_correction_bias": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.253.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.253.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.253.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.input_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_a_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_a_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_b_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_a_proj_with_mqa.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_a_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_b_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.gate.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.gate.e_score_correction_bias": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.187.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.187.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.187.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.input_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_a_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_a_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_b_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_a_proj_with_mqa.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_a_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_b_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.gate.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.gate.e_score_correction_bias": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.219.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.input_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_a_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_a_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_b_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_a_proj_with_mqa.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_a_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_b_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.gate.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.gate.e_score_correction_bias": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.input_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_a_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_a_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_b_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_a_proj_with_mqa.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_a_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_b_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.gate.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.gate.e_score_correction_bias": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.input_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_a_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_a_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_b_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_a_proj_with_mqa.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_a_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_b_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.gate.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.gate.e_score_correction_bias": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.216.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.216.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.216.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.input_layernorm.weight": "model-00034-of-000163.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00034-of-000163.safetensors", + "model.layers.15.self_attn.q_a_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_a_layernorm.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_b_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_a_proj_with_mqa.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_a_layernorm.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_b_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.gate.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.gate.e_score_correction_bias": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.190.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.input_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_a_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_a_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_b_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_a_proj_with_mqa.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_a_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_b_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.gate.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.gate.e_score_correction_bias": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.input_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_a_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_a_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_b_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_a_proj_with_mqa.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_a_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_b_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.gate.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.gate.e_score_correction_bias": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.253.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.253.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.253.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.input_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_a_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_a_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_b_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_a_proj_with_mqa.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_a_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_b_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.gate.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.gate.e_score_correction_bias": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.187.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.187.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.187.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.input_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_a_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_a_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_b_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_a_proj_with_mqa.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_a_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_b_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.gate.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.gate.e_score_correction_bias": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.219.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.219.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.219.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.input_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_a_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_a_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_b_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_a_proj_with_mqa.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_a_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_b_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.gate.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.gate.e_score_correction_bias": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.153.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.153.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.input_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_a_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_a_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_b_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_a_proj_with_mqa.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_a_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_b_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.gate.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.gate.e_score_correction_bias": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.input_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_a_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_a_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_b_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_a_proj_with_mqa.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_a_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_b_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.gate.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.gate.e_score_correction_bias": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.216.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.216.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.216.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.input_layernorm.weight": "model-00056-of-000163.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00056-of-000163.safetensors", + "model.layers.23.self_attn.q_a_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.q_a_layernorm.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.q_b_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_a_proj_with_mqa.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_a_layernorm.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_b_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.gate.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.gate.e_score_correction_bias": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.190.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.190.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.190.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.input_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_a_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_a_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_b_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_a_proj_with_mqa.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_a_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_b_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.gate.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.gate.e_score_correction_bias": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.input_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_a_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_a_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_b_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_a_proj_with_mqa.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_a_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_b_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.gate.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.gate.e_score_correction_bias": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.253.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.253.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.253.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.input_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_a_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_a_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_b_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_a_proj_with_mqa.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_a_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_b_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.gate.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.gate.e_score_correction_bias": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.187.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.187.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.187.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.input_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_a_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_a_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_b_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_a_proj_with_mqa.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_a_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_b_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.gate.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.gate.e_score_correction_bias": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.219.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.219.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.219.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.input_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_a_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_a_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_b_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_a_proj_with_mqa.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_a_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_b_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.gate.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.gate.e_score_correction_bias": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.153.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.153.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.input_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_a_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_a_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_b_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_a_proj_with_mqa.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_a_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_b_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.gate.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.gate.e_score_correction_bias": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.input_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_a_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_a_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_b_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_a_proj_with_mqa.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_a_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_b_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.gate.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.gate.e_score_correction_bias": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.216.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.216.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.216.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.input_layernorm.weight": "model-00078-of-000163.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00078-of-000163.safetensors", + "model.layers.31.self_attn.q_a_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.q_a_layernorm.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.q_b_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_a_proj_with_mqa.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_a_layernorm.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_b_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.gate.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.gate.e_score_correction_bias": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.190.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.190.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.190.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.input_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_a_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_a_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_b_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_a_proj_with_mqa.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_a_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_b_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.gate.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.gate.e_score_correction_bias": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.input_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_a_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_a_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_b_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_a_proj_with_mqa.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_a_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_b_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.gate.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.gate.e_score_correction_bias": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.253.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.253.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.253.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.input_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_a_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_a_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_b_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_a_proj_with_mqa.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_a_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_b_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.gate.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.gate.e_score_correction_bias": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.187.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.187.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.187.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.input_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_a_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_a_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_b_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_a_proj_with_mqa.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_a_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_b_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.gate.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.gate.e_score_correction_bias": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.219.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.input_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_a_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_a_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_b_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_a_proj_with_mqa.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_a_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_b_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.gate.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.gate.e_score_correction_bias": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.input_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_a_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_a_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_b_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_a_proj_with_mqa.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_a_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_b_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.gate.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.gate.e_score_correction_bias": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.input_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_a_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_a_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_b_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_a_proj_with_mqa.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_a_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_b_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.gate.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.gate.e_score_correction_bias": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.216.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.216.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.216.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.input_layernorm.weight": "model-00100-of-000163.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00100-of-000163.safetensors", + "model.layers.39.self_attn.q_a_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_a_layernorm.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_b_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_a_proj_with_mqa.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_a_layernorm.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_b_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.o_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.gate.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.gate.e_score_correction_bias": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.190.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.input_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_a_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_a_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_b_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_a_proj_with_mqa.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_a_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_b_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.gate.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.gate.e_score_correction_bias": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.input_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_a_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_a_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_b_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_a_proj_with_mqa.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_a_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_b_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.o_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.gate.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.gate.e_score_correction_bias": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.253.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.253.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.253.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.input_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.41.post_attention_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_a_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_a_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_b_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_a_proj_with_mqa.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_a_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_b_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.gate.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.gate.e_score_correction_bias": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.187.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.187.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.187.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.input_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_a_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_a_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_b_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_a_proj_with_mqa.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_a_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_b_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.o_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.gate.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.gate.e_score_correction_bias": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.219.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.input_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_a_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_a_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_b_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_a_proj_with_mqa.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_a_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_b_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.gate.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.gate.e_score_correction_bias": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.input_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_a_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_a_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_b_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_a_proj_with_mqa.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_a_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_b_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.o_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.gate.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.gate.e_score_correction_bias": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.input_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_a_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_a_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_b_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_a_proj_with_mqa.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_a_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_b_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.gate.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.gate.e_score_correction_bias": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.216.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.216.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.216.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.input_layernorm.weight": "model-00122-of-000163.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00122-of-000163.safetensors", + "model.layers.47.self_attn.q_a_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_a_layernorm.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_b_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_a_proj_with_mqa.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_a_layernorm.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_b_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.o_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.gate.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.gate.e_score_correction_bias": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.92.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.190.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.input_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.47.post_attention_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_a_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_a_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_b_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_a_proj_with_mqa.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_a_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_b_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.o_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.gate.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.gate.e_score_correction_bias": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.input_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.48.post_attention_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_a_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_a_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_b_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_a_proj_with_mqa.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_a_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_b_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.o_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.gate.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.gate.e_score_correction_bias": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.253.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.253.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.253.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.input_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.49.post_attention_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_a_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_a_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_b_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_a_proj_with_mqa.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_a_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_b_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.o_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.gate.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.gate.e_score_correction_bias": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.187.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.187.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.187.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.input_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.50.post_attention_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_a_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_a_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_b_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_a_proj_with_mqa.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_a_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_b_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.o_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.gate.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.gate.e_score_correction_bias": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.219.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.input_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.51.post_attention_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_a_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_a_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_b_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_a_proj_with_mqa.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_a_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_b_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.o_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.gate.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.gate.e_score_correction_bias": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.input_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.52.post_attention_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_a_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_a_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_b_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_a_proj_with_mqa.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_a_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_b_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.o_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.gate.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.gate.e_score_correction_bias": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.input_layernorm.weight": "model-00141-of-000163.safetensors", + "model.layers.53.post_attention_layernorm.weight": "model-00141-of-000163.safetensors", + "model.layers.54.self_attn.q_a_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_a_layernorm.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_b_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_a_proj_with_mqa.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_a_layernorm.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_b_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.o_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.gate.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.gate.e_score_correction_bias": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.92.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.92.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.190.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.input_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.54.post_attention_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_a_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_a_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_b_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_a_proj_with_mqa.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_a_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_b_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.o_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.gate.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.gate.e_score_correction_bias": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.input_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.55.post_attention_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_a_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_a_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_b_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_a_proj_with_mqa.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_a_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_b_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.o_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.gate.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.gate.e_score_correction_bias": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.253.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.253.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.253.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.input_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.56.post_attention_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_a_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_a_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_b_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_a_proj_with_mqa.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_a_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_b_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.o_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.gate.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.gate.e_score_correction_bias": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.187.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.187.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.187.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.input_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.57.post_attention_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_a_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_a_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_b_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_a_proj_with_mqa.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_a_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_b_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.o_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.gate.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.gate.e_score_correction_bias": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.219.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.input_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.58.post_attention_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_a_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_a_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_b_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_a_proj_with_mqa.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_a_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_b_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.o_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.gate.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.gate.e_score_correction_bias": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.55.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.input_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.59.post_attention_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_a_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_a_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_b_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_a_proj_with_mqa.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_a_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_b_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.o_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.gate.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.gate.e_score_correction_bias": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.input_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.60.post_attention_layernorm.weight": "model-00160-of-000163.safetensors", + "model.norm.weight": "model-00160-of-000163.safetensors", + "lm_head.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_a_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_a_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_b_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_a_proj_with_mqa.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_a_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_b_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.o_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.gate.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.gate.e_score_correction_bias": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.195.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.195.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.195.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.input_layernorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.post_attention_layernorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.embed_tokens.weight": "model-00163-of-000163.safetensors", + "model.layers.61.enorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.hnorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.eh_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.shared_head.norm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.shared_head.head.weight": "model-00163-of-000163.safetensors" + } +} \ No newline at end of file