diff --git a/.gitattributes b/.gitattributes index f877b2a68e2c78c07171ccbd8326cab014112705..0d4cb185280917cac60ef7195f2a6250b2b90d83 100644 --- a/.gitattributes +++ b/.gitattributes @@ -35,5 +35,3 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text tekken.json filter=lfs diff=lfs merge=lfs -text tokenizer.json filter=lfs diff=lfs merge=lfs -text -Mistral-Large-3-675B-Instruct-2512-BF16/tekken.json filter=lfs diff=lfs merge=lfs -text -Mistral-Large-3-675B-Instruct-2512-BF16/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/Mistral-Large-3-675B-Instruct-2512-BF16/.gitattributes b/Mistral-Large-3-675B-Instruct-2512-BF16/.gitattributes new file mode 100644 index 0000000000000000000000000000000000000000..0d4cb185280917cac60ef7195f2a6250b2b90d83 --- /dev/null +++ b/Mistral-Large-3-675B-Instruct-2512-BF16/.gitattributes @@ -0,0 +1,37 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tekken.json filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/consolidated-00001-of-00272.safetensors b/consolidated-00001-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6112914cfed5a7a1a3bdd549417700f9e71c6dd4 --- /dev/null +++ b/consolidated-00001-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7135049bc93ff62de095e1d287cd946a1635efb74e313b28a48c123f555c124 +size 4998260600 diff --git a/consolidated-00002-of-00272.safetensors b/consolidated-00002-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a1ee49a11a2247cb6b7c3678b6eca3ff99054654 --- /dev/null +++ b/consolidated-00002-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bdafc45e53f2b2035f2e546a7123e8dee3d1661a37e423c47684b29fbbd440a +size 4991231040 diff --git a/consolidated-00003-of-00272.safetensors b/consolidated-00003-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2077332c4aaf8c8d5b0e33779336c5747330f188 --- /dev/null +++ b/consolidated-00003-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ee12de716146875e8a1b49e7abbd08bb1c49aa5c8efec0b5bc9c24db1efdd0 +size 4991230984 diff --git a/consolidated-00004-of-00272.safetensors b/consolidated-00004-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5a3c05f7b61cec6017bf34122130c34798a01fc9 --- /dev/null +++ b/consolidated-00004-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d4d2e40f24c9fb0d6c469e4330cb71f8fd05200b9305e41281f450aabcfc4cf +size 4991230984 diff --git a/consolidated-00005-of-00272.safetensors b/consolidated-00005-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9c81681822eaa1c0149455d1f221895feffb96e0 --- /dev/null +++ b/consolidated-00005-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9472aa66fc83a2fa369c5cd11684d64d595eca5c71b3d8b4c617ef1fd16e19e +size 4991230984 diff --git a/consolidated-00006-of-00272.safetensors b/consolidated-00006-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0eda13992cdcf79855f4828fa09467edf3123bd1 --- /dev/null +++ b/consolidated-00006-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbd39f06099297a5d484bc1327a7450cf3fcafb04c215b2cd64e623cb4edcfe +size 4956267912 diff --git a/consolidated-00007-of-00272.safetensors b/consolidated-00007-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..265697f8cb01f8ed38815750b47fabaafb60d24e --- /dev/null +++ b/consolidated-00007-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1712a6e1471f95e8d8a5728dd8792c247cc9ee53e8be80a9a5233e080654a39e +size 4991231008 diff --git a/consolidated-00008-of-00272.safetensors b/consolidated-00008-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1e19a0003cc3836ea557604f84967e482485edd4 --- /dev/null +++ b/consolidated-00008-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6cc472310038cf56838cbbe36b43f30f5f79c50ec9f41d631e5b428d4d4a5d0 +size 4991230984 diff --git a/consolidated-00009-of-00272.safetensors b/consolidated-00009-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bebbb26e620dc0df5d51b87b446aa53ff848552c --- /dev/null +++ b/consolidated-00009-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5a95f2d7ef3c8bf31bc3b9cec6a1f263e26bab673be15304d7f0e6cc2b289af +size 4991230984 diff --git a/consolidated-00010-of-00272.safetensors b/consolidated-00010-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..40d75dfa313d1f65342fc268667f9b0464f4cf2c --- /dev/null +++ b/consolidated-00010-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95795d9297ad590fb7c634a5ad5d4b4498e4054e52907b787ae3f85e32310a8e +size 4956267864 diff --git a/consolidated-00011-of-00272.safetensors b/consolidated-00011-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b873458e4c29f9cee871ea1a3f55155aec47ce4b --- /dev/null +++ b/consolidated-00011-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf2c0b61d20a86bc3c95104a0c36533b54740437d980044cc985bdf4b8e64d8 +size 4991231064 diff --git a/consolidated-00012-of-00272.safetensors b/consolidated-00012-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc9f0eae39e14dd810ea69db1dbde2918afe45d6 --- /dev/null +++ b/consolidated-00012-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e76fc9a92ba29ab0ce74b444686ff922287173192d1b47db23859c821dfb602 +size 4991230984 diff --git a/consolidated-00013-of-00272.safetensors b/consolidated-00013-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..327a6ff3049480830bea523348533a865d64a4c7 --- /dev/null +++ b/consolidated-00013-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a20a1531870d72103dd7c8558d693a1c596b681e60f7ea89bd34151fdc27b01 +size 4991230984 diff --git a/consolidated-00014-of-00272.safetensors b/consolidated-00014-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..702bdfd5988bd68333dfdb352dafd742636830ad --- /dev/null +++ b/consolidated-00014-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef7138911f14857cafa790f02c5f879b9b961277047394aac2222cd9b7f0da4d +size 4991230984 diff --git a/consolidated-00015-of-00272.safetensors b/consolidated-00015-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d897429e47c93203c8a209a1f79f75ecf6180f1c --- /dev/null +++ b/consolidated-00015-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ae8fb431645d20e598aff80b3381dd1afe94c53dafe68ef43f32470fa44903 +size 4956267896 diff --git a/consolidated-00016-of-00272.safetensors b/consolidated-00016-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8fbbc8892def6116776486a460df6f332666728a --- /dev/null +++ b/consolidated-00016-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7d544e1d920b7c25763dfd83e85305ca1cc37c3f042bc473700f46031b99dd2 +size 4991231032 diff --git a/consolidated-00017-of-00272.safetensors b/consolidated-00017-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2be9b73e6aa5f947d20c0af882d8a463caf27b7a --- /dev/null +++ b/consolidated-00017-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a560c93a15f4a5335c4d2c2fd9a2572d2da07c826e680daa01d07fcba9862fb +size 4991230984 diff --git a/consolidated-00018-of-00272.safetensors b/consolidated-00018-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d9d41dd27415362bbde953154da8340396ce203f --- /dev/null +++ b/consolidated-00018-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a460a2300ff522a00fc502c09eda78a279a95f5b8d7238a44be572d3970ad1 +size 4991230984 diff --git a/consolidated-00019-of-00272.safetensors b/consolidated-00019-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb34821b918c8302ab6d958340692c1eba35d87b --- /dev/null +++ b/consolidated-00019-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b8b2ecd9696418bf6c7210db78dc38983d1d571685cd0865fa3ca33befd82f +size 4858735960 diff --git a/consolidated-00020-of-00272.safetensors b/consolidated-00020-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ab6183b31651d7d2d6a7d2f22393995e96b0e91 --- /dev/null +++ b/consolidated-00020-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f75191a82e853846060fbb54e94ff8e8d158250999c577c8f2013ee6e174149b +size 4971322232 diff --git a/consolidated-00021-of-00272.safetensors b/consolidated-00021-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fbe4fb2d997bd8bf5ddffe4453c977d437cc8ca4 --- /dev/null +++ b/consolidated-00021-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973deca15ef833c2e7a16413821f4c73682d1fc78fa56e2a03e418bed28d7507 +size 4991231008 diff --git a/consolidated-00022-of-00272.safetensors b/consolidated-00022-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1448235184bfb425b244acf7885f78f9cc7d74a --- /dev/null +++ b/consolidated-00022-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b1f3a4b7faf9d95a22a730cacf9d42606fe973a8e45c3a83ff9448ad35cbcc2 +size 4991230984 diff --git a/consolidated-00023-of-00272.safetensors b/consolidated-00023-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..af4e73538f8161cecf3b8592f26a617017fb6ef9 --- /dev/null +++ b/consolidated-00023-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217af536f350a11a1ed9223ad3d2db16bf06eec8c261a9462a73880124c83dff +size 4991230984 diff --git a/consolidated-00024-of-00272.safetensors b/consolidated-00024-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8ad47f1ebf8e313736291e8fedb11ddf94ff8d8 --- /dev/null +++ b/consolidated-00024-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c65b00234b93b5b83cd0102baa5bfea7b336d6bdda6c320d87b1034613b1a1d1 +size 4956267872 diff --git a/consolidated-00025-of-00272.safetensors b/consolidated-00025-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d6f041c41f8a2a830855328edd8f0a45df32628b --- /dev/null +++ b/consolidated-00025-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:685df140e4a256ed71461afd46b28479ac457f0fdc793edd78b4149a1c74ed7c +size 4991231064 diff --git a/consolidated-00026-of-00272.safetensors b/consolidated-00026-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ad7a517fbef4d4c28532fa952b47c0c2aabb4212 --- /dev/null +++ b/consolidated-00026-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f233eec802252172dcafce8703ecf2a4c5833be521f4952b316b512365b895f0 +size 4991230984 diff --git a/consolidated-00027-of-00272.safetensors b/consolidated-00027-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ef6ebc74d2f3e19eeac746884f5a1ac929334a83 --- /dev/null +++ b/consolidated-00027-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f106f41670d9db62b4d798ffcb74e63568c08561da6b8350e6e647319353540c +size 4991230984 diff --git a/consolidated-00028-of-00272.safetensors b/consolidated-00028-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9fa1494321375b20b5482478dcf24d2c85ccbb71 --- /dev/null +++ b/consolidated-00028-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c82c4f787c7772d9aad195acb05fb6c5c0e98c438ff6b1842d6a633fe5e926 +size 4991230984 diff --git a/consolidated-00029-of-00272.safetensors b/consolidated-00029-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..205f5b56aee8ad876b5634e7a6869c81941ec227 --- /dev/null +++ b/consolidated-00029-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2566373a01235c7d6bb30d184f656b546961d26100bfe88773797ba45affcb8 +size 4956267904 diff --git a/consolidated-00030-of-00272.safetensors b/consolidated-00030-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b6d09f561edaee5338af5f627478aaf22b3a3fd2 --- /dev/null +++ b/consolidated-00030-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19da7a878bfcd71ced48ab4c9067c8400c0d40bfbb3341a57886d36ea0286024 +size 4991231032 diff --git a/consolidated-00031-of-00272.safetensors b/consolidated-00031-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b06efcaf647bd818430f008297e5ebcec6791aea --- /dev/null +++ b/consolidated-00031-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c8fee18f0c26e6c76b5a1a68f5054ee0ab59b812134c4d45906b2edec7f94b0 +size 4991230984 diff --git a/consolidated-00032-of-00272.safetensors b/consolidated-00032-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3ddb17eb5bd2302dce9406dcdab60a24219804a0 --- /dev/null +++ b/consolidated-00032-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c62250c662b7f5a6e54a26567dfe13b5885d0cc6d4b98a663e8dece85b280ca +size 4991230984 diff --git a/consolidated-00033-of-00272.safetensors b/consolidated-00033-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb1ab845a19335b8b896e8b524462f44d95773ca --- /dev/null +++ b/consolidated-00033-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf7c44010b063e0c4e23bda1636e3f5e218d18e24860fca8d6a9c716f9cae953 +size 4956267856 diff --git a/consolidated-00034-of-00272.safetensors b/consolidated-00034-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8dd49ee59a5cb1e503732f6e615c0015b68af678 --- /dev/null +++ b/consolidated-00034-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d1a3342fb3a44b94e1195103e23e80d00b51eb9e64eb3589c1d3e1d53d307e +size 4991231064 diff --git a/consolidated-00035-of-00272.safetensors b/consolidated-00035-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..128633f1704942836e00e3851d6104f152aa5ad0 --- /dev/null +++ b/consolidated-00035-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58a569c98ee40513330f25ac5ba28dc8ad5d45564207067cb71e301870de6c7 +size 4991231000 diff --git a/consolidated-00036-of-00272.safetensors b/consolidated-00036-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1574cb1eb5ada539896b74e17fce0b0a782be6ee --- /dev/null +++ b/consolidated-00036-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1701fa4e09d02b5101b1c319b56b3859168ba3d9e2bb9c942d8edd78b581b34e +size 4991230984 diff --git a/consolidated-00037-of-00272.safetensors b/consolidated-00037-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6a28f3e9b1c6caac46f784907a6979e158158932 --- /dev/null +++ b/consolidated-00037-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3721aa8b49c273dd83fd665a1afa379555eb9da0b950cbf7106d8971d3fbdfc +size 4991230984 diff --git a/consolidated-00038-of-00272.safetensors b/consolidated-00038-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b9410f7bbc5c17d5d0a03460235aeffe7bc6425b --- /dev/null +++ b/consolidated-00038-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:270f0aa1946d42a930071f142930ddad9d32c501e5635b73725ddf506969fa03 +size 4956267880 diff --git a/consolidated-00039-of-00272.safetensors b/consolidated-00039-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e179ed5b450bf056ae47957a204ded55be17fecb --- /dev/null +++ b/consolidated-00039-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca7dfda133d0657e38378cb459a080a52d317514aee533fecb9c745d84cea16e +size 4991231056 diff --git a/consolidated-00040-of-00272.safetensors b/consolidated-00040-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d54d94ea0eed406e8eab9d32bd8cd84508af1446 --- /dev/null +++ b/consolidated-00040-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c10895692d0ce17458d37da53b4566a5da50ffe1f1ed5d7d56b728b45d3b56d +size 4991230984 diff --git a/consolidated-00041-of-00272.safetensors b/consolidated-00041-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e4f54e1eee572e5cc9fbff2ee1531b221c35695 --- /dev/null +++ b/consolidated-00041-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a57f7d0371710878b27b1b508ec731ade0a906db3fc5b8b7eb545e6859027119 +size 4991230984 diff --git a/consolidated-00042-of-00272.safetensors b/consolidated-00042-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..31bc336477d9bfe9ecee9035b641487fc225f59c --- /dev/null +++ b/consolidated-00042-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce788617f5a69dd37d92ad33d092e4c20d77cd171a32a7dc8a67edde9522881 +size 4991230984 diff --git a/consolidated-00043-of-00272.safetensors b/consolidated-00043-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0e5b267d1becbbefaa67e944b0c6142ef34df49b --- /dev/null +++ b/consolidated-00043-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b413bdd1d9e2d750ff62b2405211a07d88073a0191cd046742956217d37f2fb2 +size 4956267904 diff --git a/consolidated-00044-of-00272.safetensors b/consolidated-00044-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3defee99214f85a87f1704a50eca027860ff629 --- /dev/null +++ b/consolidated-00044-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78dcf27fa15eaff66154e61d411ad8f9fc941bb9dd6c37ad5d2df0a928a17e3d +size 4991231024 diff --git a/consolidated-00045-of-00272.safetensors b/consolidated-00045-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94178812db87c974a306df7f6e9e125e9a0a80e0 --- /dev/null +++ b/consolidated-00045-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af300dcdcd96f0c9b50928643ebc37f70f81e91dbb98abf48ab49e7579f912d +size 4991230984 diff --git a/consolidated-00046-of-00272.safetensors b/consolidated-00046-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a8e5c8a799d051a57516ec6e2b386308d1f9c1d6 --- /dev/null +++ b/consolidated-00046-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b20dc5770c95bfc8cd2d8e0fede4476d0c9ef655a33e7694926065a98f49f76d +size 4991230984 diff --git a/consolidated-00047-of-00272.safetensors b/consolidated-00047-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db45b1153e84ef667cb4dd96d8514541e49d9865 --- /dev/null +++ b/consolidated-00047-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b24116038ff730af2ac07ce2da4bf21c29ad4712c7980d18c17667526746b3f1 +size 4838826472 diff --git a/consolidated-00048-of-00272.safetensors b/consolidated-00048-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d4c838c2e68f3d0a7f569513f4699eb170bc9c06 --- /dev/null +++ b/consolidated-00048-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af51dc15f7a14a4b647d22b73d383fc2295b237f52a2115156ad98d58686f65f +size 4954432480 diff --git a/consolidated-00049-of-00272.safetensors b/consolidated-00049-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cee06838a41408bc66102590364273d616ccf816 --- /dev/null +++ b/consolidated-00049-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c5cfcda51ea07f2febf4797fe39b08721efab1c06a4892137ada922e3a014f +size 4991231008 diff --git a/consolidated-00050-of-00272.safetensors b/consolidated-00050-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..411ec74a3cbb854c989b109e699a059b2915b35c --- /dev/null +++ b/consolidated-00050-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78e9224d869a6184a376ed6203d277dbd92f2a1643c8178c76c0e04338237b0b +size 4991230984 diff --git a/consolidated-00051-of-00272.safetensors b/consolidated-00051-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b015d346f6bc99910be8ab9d49a3eb78a5fc845d --- /dev/null +++ b/consolidated-00051-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67cf79db5f6d79c5d1b6963eeb5a14a25ddd7d0a2135da32b7645231f0a80181 +size 4991230984 diff --git a/consolidated-00052-of-00272.safetensors b/consolidated-00052-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1f1221efe9152ceb531cb290aa695eed02586e4f --- /dev/null +++ b/consolidated-00052-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ddc76b66fc72851eb288369d1c5cb3f210d6cd12ab7a52df17e274b1cfaacf0 +size 4956267872 diff --git a/consolidated-00053-of-00272.safetensors b/consolidated-00053-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..084720067275b6296c7ecd6bc75e9e2c23b60244 --- /dev/null +++ b/consolidated-00053-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcbbb016dbe5b6675f19cc59de1537ae27814e3ce14c59c782a7995e8ec413e8 +size 4991231064 diff --git a/consolidated-00054-of-00272.safetensors b/consolidated-00054-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d123480716392ace452efd1db0e0bcb18ba932f0 --- /dev/null +++ b/consolidated-00054-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0378966c5a4a4a9993078613b872bdf04002057bc4d641d520b37bd1b1eb811 +size 4991230984 diff --git a/consolidated-00055-of-00272.safetensors b/consolidated-00055-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4eb73471d0f6c750ed7997150b62bc17dcf84bcf --- /dev/null +++ b/consolidated-00055-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:475a152c46eb90b2c75d5edb77288120415d10711d5a3d4a42b20a5e885cde5b +size 4991230984 diff --git a/consolidated-00056-of-00272.safetensors b/consolidated-00056-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..00d0257720090516eca921d0648a4faf701c2212 --- /dev/null +++ b/consolidated-00056-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42e339ae8c59b37d357d2742aa288f0b62bffadde3f9aff8c7d6b0f859ec4dfb +size 4991230984 diff --git a/consolidated-00057-of-00272.safetensors b/consolidated-00057-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7fd3b1366df042fea0daabafb8bf712041370749 --- /dev/null +++ b/consolidated-00057-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f496247e7e776094886d176ae41db529a6c45fc0d263fb2ff4d25634e3ddb1f7 +size 4956267896 diff --git a/consolidated-00058-of-00272.safetensors b/consolidated-00058-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..91712ce967d30ca929cc402fd45e09beb393be8e --- /dev/null +++ b/consolidated-00058-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3abd59d05bc2d10167924ce30c7ef20379b2114745f38dd7d179d1af82b090d9 +size 4991231032 diff --git a/consolidated-00059-of-00272.safetensors b/consolidated-00059-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc8675c2b2821f9a65f06e3e656cdb7bff88c025 --- /dev/null +++ b/consolidated-00059-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b81ab0921a6374b2af34adc85c54552cce6a462242849c34b340dd16e6ac110c +size 4991230984 diff --git a/consolidated-00060-of-00272.safetensors b/consolidated-00060-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1bd687ead974d277cd0c7f8fdb48313c29e2781 --- /dev/null +++ b/consolidated-00060-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d730d5a7c7a0c610499877dd3e705a3270c0dcc856f47f267cda05b8760984a +size 4991230984 diff --git a/consolidated-00061-of-00272.safetensors b/consolidated-00061-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0df01465ad55c23108f338a4c4bb626cb914b665 --- /dev/null +++ b/consolidated-00061-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de171b4aed7a3dbd7e68e4320147c1d0c85b487df613a7d3fe46a372f2c26f8c +size 4800015592 diff --git a/consolidated-00062-of-00272.safetensors b/consolidated-00062-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f770ce6a33ef7755dc7b1d4abf0ad5368a77ef19 --- /dev/null +++ b/consolidated-00062-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2e9d9a107fd14ba0cd8c65979cb9d64e840c5de8a74159628dc05b656c6982e +size 4971322232 diff --git a/consolidated-00063-of-00272.safetensors b/consolidated-00063-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5b27a00c4b52c035a3e70cced9ef6ba988264047 --- /dev/null +++ b/consolidated-00063-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d60b23754cf50b694559d01af3cb5fb6a4e6efe79d791bc2845027e4092ee00 +size 4991231008 diff --git a/consolidated-00064-of-00272.safetensors b/consolidated-00064-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..30fbf37082eaac44bd63dd62b600cc0a27b16949 --- /dev/null +++ b/consolidated-00064-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c36f3a71393f7d6f9d63a3bb5da40136d050c888bf15d33f1c63714ce503e4a +size 4991230984 diff --git a/consolidated-00065-of-00272.safetensors b/consolidated-00065-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0fa459838c5c45d15e89f617c7bcf2def95333c4 --- /dev/null +++ b/consolidated-00065-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854f12e79c0a32049d632965fd809db4bcf0980d1cce0a0d7b1ac18a0d50578b +size 4991230984 diff --git a/consolidated-00066-of-00272.safetensors b/consolidated-00066-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..003e82edb68cb1ed142d846c6741d3c3d49964c3 --- /dev/null +++ b/consolidated-00066-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81aad864a5b53eb74b06e6980993d7440b7dfb5d71ae4c03f04e5dbf46c4ba85 +size 4956267872 diff --git a/consolidated-00067-of-00272.safetensors b/consolidated-00067-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cf74f48b43b7a32be4c63182d5f943fb534a93b7 --- /dev/null +++ b/consolidated-00067-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e8f4e6a723dbce87f5c011c0343b0c6764eb3315d60bba8ecaa71798ac24c05 +size 4991231064 diff --git a/consolidated-00068-of-00272.safetensors b/consolidated-00068-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..696fbeeceb6e84f7bc588d05193a14d127f5e3a9 --- /dev/null +++ b/consolidated-00068-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5932f757b5e577f4eb8fc85cc161e349f3559cbc2b5c0d0d3210d95741653d3d +size 4991230984 diff --git a/consolidated-00069-of-00272.safetensors b/consolidated-00069-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a81e6373630c1cabefd5a5b22e7dd3eb22adac08 --- /dev/null +++ b/consolidated-00069-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f4efa6e433da56b0721b85574ee1389f3ebcb1b665812cdf0c5793dad0f58e +size 4991230984 diff --git a/consolidated-00070-of-00272.safetensors b/consolidated-00070-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3c7fd1773732b53abf5fedfda129ee30cca2009b --- /dev/null +++ b/consolidated-00070-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984de1b71cee682820c60151a6cfbf00c39ee873e282a30c0784c7c75e7b8b78 +size 4991230984 diff --git a/consolidated-00071-of-00272.safetensors b/consolidated-00071-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..20bef65b2b6713250cb942fb606a364f34e6dcda --- /dev/null +++ b/consolidated-00071-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9a2f40da601e2852072bc64d632f7411a77e147a29d753c99aecde685eb9be +size 4956267904 diff --git a/consolidated-00072-of-00272.safetensors b/consolidated-00072-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8c4778df64f0b96c569fd90bffee8fe5ce80d7e --- /dev/null +++ b/consolidated-00072-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3647013675437bb1d992b72743ffc340de2a4504f2763e1c4228f7a72080ef26 +size 4991231032 diff --git a/consolidated-00073-of-00272.safetensors b/consolidated-00073-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2e92f34da4c948ade12428ec806da4f6684b4b0 --- /dev/null +++ b/consolidated-00073-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc016f2f1c0cb6c8569b9fa35598d797653af7de87d573b424f72b3871e485a +size 4991230984 diff --git a/consolidated-00074-of-00272.safetensors b/consolidated-00074-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2c0701eb7e97b1230ffda7e2099392427cc0742 --- /dev/null +++ b/consolidated-00074-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe129174bed917ccc4f1de9a0e8ca31247569be07b79e3c47a0c858b295828d7 +size 4991230984 diff --git a/consolidated-00075-of-00272.safetensors b/consolidated-00075-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b9c826985e0ae798e8f43456a56fe0d6c1c45776 --- /dev/null +++ b/consolidated-00075-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fc2f51556b8e4a7e6ac0e17bc2013952c770eddaec7c4293283d029fe58b4df +size 4956267856 diff --git a/consolidated-00076-of-00272.safetensors b/consolidated-00076-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..97895a69402cbc0e53bab2f406b4bbe1651f26a3 --- /dev/null +++ b/consolidated-00076-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da921d932ba670b0c802e64945dfd505739df1fb00b4981ac796ed1ecb0d4d35 +size 4991231064 diff --git a/consolidated-00077-of-00272.safetensors b/consolidated-00077-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e9f1800122d4415becea78e0c4a27d7c57cea2d7 --- /dev/null +++ b/consolidated-00077-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd448ddf742dea3ebdd1b519d2b75b6461f3be86b362fffc26da3c7f215745b +size 4991231000 diff --git a/consolidated-00078-of-00272.safetensors b/consolidated-00078-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a60e7713d6f3610d4272bcfc7dd4b941af27c859 --- /dev/null +++ b/consolidated-00078-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93740858847285d19aaca15bc07e83bb533c2764ebf5b0a596d9ac1c011715c3 +size 4991230984 diff --git a/consolidated-00079-of-00272.safetensors b/consolidated-00079-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a89d7009c534205e572e68183215387335bb2fa0 --- /dev/null +++ b/consolidated-00079-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23de7e6978f9f39f3cfcb16a61ff7a9a518e477fcf51a907dddd4c68b36997d9 +size 4991230984 diff --git a/consolidated-00080-of-00272.safetensors b/consolidated-00080-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..34e3c4042cb8dd1f751d2e67359bec5ae58b9a18 --- /dev/null +++ b/consolidated-00080-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:541998a99177a7cb6ed5c6c3aa056a0356b3a487890eee5606f5de4897d9e4cc +size 4956267880 diff --git a/consolidated-00081-of-00272.safetensors b/consolidated-00081-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a058f7d17b6c2b8ff2db52bbbade2f929a0832a --- /dev/null +++ b/consolidated-00081-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fa0f947f3a73abb1925b40201f0e81d90b601fc246cf902a4deab67a815d67d +size 4991231056 diff --git a/consolidated-00082-of-00272.safetensors b/consolidated-00082-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9647eb430b120f59227f01614d7b3cdec2317fd8 --- /dev/null +++ b/consolidated-00082-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ef3c7c69900ad487e499604648adc01e7d9ca0f4bc55847cc832f56dd8284f +size 4991230984 diff --git a/consolidated-00083-of-00272.safetensors b/consolidated-00083-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bf3e8526aa7bad8510218a6b86cbadd0524b9232 --- /dev/null +++ b/consolidated-00083-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b13fc7ed72c50bba558b242fbddf882b729c6355adce6ad0760205d5511efb90 +size 4991230984 diff --git a/consolidated-00084-of-00272.safetensors b/consolidated-00084-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7ba4492b7d5b2d449ee01454e78dddecc176e164 --- /dev/null +++ b/consolidated-00084-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7ead4552002679f06b5506a0ed5a0c8a5d586873bce95aedeb9bbc8f3d22d90 +size 4991230984 diff --git a/consolidated-00085-of-00272.safetensors b/consolidated-00085-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7abe92753b6984a21d07bd9f87d34f62be0b2e8f --- /dev/null +++ b/consolidated-00085-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f0ed20e6c42a71e79e15870a1adce0e14baee14ec33d7cb7909d6051f5a15c +size 4956267904 diff --git a/consolidated-00086-of-00272.safetensors b/consolidated-00086-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d01985921e09fadf571e4ab3bf735799b6f0ec7 --- /dev/null +++ b/consolidated-00086-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5e9806461c0f51effc8dd7bccec4ef937c9b2375cbe2383778c0e6e0c745f17 +size 4991231024 diff --git a/consolidated-00087-of-00272.safetensors b/consolidated-00087-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..13f514a3bc1fa3287bab15874d10183a1fa4a889 --- /dev/null +++ b/consolidated-00087-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d3ae2eeb38f34bfdfdc98426b3f575754fe5543f29a03837e200bb80a74ec05 +size 4991230984 diff --git a/consolidated-00088-of-00272.safetensors b/consolidated-00088-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b4130bf2f8eee76559f3457da81615b3958ecd17 --- /dev/null +++ b/consolidated-00088-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:205298f9d16256493063540c831fb846381fe1f864f2e612a112869d07d3a219 +size 4991230984 diff --git a/consolidated-00089-of-00272.safetensors b/consolidated-00089-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bfa3d0d96bfba30e5136b12a7e8805bfc8064904 --- /dev/null +++ b/consolidated-00089-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa26311e28991a3e483bd1b0267923ec59c9ffc9f1e49f485eccaf5aec9e41de +size 4956267856 diff --git a/consolidated-00090-of-00272.safetensors b/consolidated-00090-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4830514bc60dc320adc1f953a507c02bbb139586 --- /dev/null +++ b/consolidated-00090-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8d110cdad866299454dbde797fc9f3489135640014a7a008eec677a42cba459 +size 4991231072 diff --git a/consolidated-00091-of-00272.safetensors b/consolidated-00091-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..551d40160f8f1c8ff175036c08279c8b2da7be3f --- /dev/null +++ b/consolidated-00091-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92575c14e24a9308fd6cae97e82d50291e57fd5747b7b428a7167b08fc609398 +size 4991230992 diff --git a/consolidated-00092-of-00272.safetensors b/consolidated-00092-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1200d234ff1956f84366381b66516e25456745b4 --- /dev/null +++ b/consolidated-00092-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2902dba09abb6e4a5b6c3f7a7fe620d49b45076000faa7921d2b97daffc3a3d1 +size 4991230984 diff --git a/consolidated-00093-of-00272.safetensors b/consolidated-00093-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..046d2019b3d1c2a390be7e73eb1eb69ccd39e42e --- /dev/null +++ b/consolidated-00093-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e771c880bee223e3cdfbc37c0bd1004c03768c4b408f424da5edb2ccf75253e +size 4991230984 diff --git a/consolidated-00094-of-00272.safetensors b/consolidated-00094-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c5121abea809365a270e646549c571f797d05ece --- /dev/null +++ b/consolidated-00094-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db0a46e1c8401ba690ba753606c43d5e98256c2c96552021c80ca3524a3ad0b8 +size 4956267840 diff --git a/consolidated-00095-of-00272.safetensors b/consolidated-00095-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e24c40924da7fdc44b2b27b0a3dd2d87f7a49b36 --- /dev/null +++ b/consolidated-00095-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c9b08b343d05ba2f58bd68e2574d172cb5778dcbb37f908015215c09e6b6fe +size 4991230960 diff --git a/consolidated-00096-of-00272.safetensors b/consolidated-00096-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3be733df3749fd615a26618d9076d19b5e409bc --- /dev/null +++ b/consolidated-00096-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bab696044e5e88876fb8535a9de12b1ca8bf09ad3e85be69494725065d96e8ba +size 4991230904 diff --git a/consolidated-00097-of-00272.safetensors b/consolidated-00097-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cceeff85bd18a0919db778acca24a04f251842f9 --- /dev/null +++ b/consolidated-00097-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ddd96a2ce6f3128a1fc147e9b307da02ed4c05e00c842832db9236cd0334a3b +size 4991230896 diff --git a/consolidated-00098-of-00272.safetensors b/consolidated-00098-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3f6f74b34f22ff282eac02bde512e5ff0d602d0c --- /dev/null +++ b/consolidated-00098-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec98a2dd9761011b01aa6331267fc3fa79dd35f1f161214118f4eebeca03636 +size 4991230904 diff --git a/consolidated-00099-of-00272.safetensors b/consolidated-00099-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69cd8abddf924ae908b4359087f9dcad31734676 --- /dev/null +++ b/consolidated-00099-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:072302faeb891b038394c5753ee64e922683459cdeb033200f188c69a02ce5a4 +size 4956267904 diff --git a/consolidated-00100-of-00272.safetensors b/consolidated-00100-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..da5d6286aec52f5988b4438c2c1845a5e1e22380 --- /dev/null +++ b/consolidated-00100-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b8b71cd8206752c18a6388f1b6e5c2c2023e91b3819a60642eec3bebcbbde2 +size 4991231008 diff --git a/consolidated-00101-of-00272.safetensors b/consolidated-00101-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8e2c87ecd1e3a12185ca5eeb2df701e6f42534e --- /dev/null +++ b/consolidated-00101-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01e32f4b550adf5be9e47f0d5ec54e07fb8ec30f963a73a5f4301f20f7ecfc33 +size 4991230984 diff --git a/consolidated-00102-of-00272.safetensors b/consolidated-00102-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f438a4dde305b6193628126ea4b0105233cc418c --- /dev/null +++ b/consolidated-00102-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28fac0502240cc526a0116db9c74baa6bc31f542463e15db24c878453ddcfa05 +size 4991230984 diff --git a/consolidated-00103-of-00272.safetensors b/consolidated-00103-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6fe9c043a9025880be31c7564bbb7f9d88b9c3f2 --- /dev/null +++ b/consolidated-00103-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b0927a943c89ac0b2d215cd798b00de61918b2797c7eed062069538001b954 +size 4956267864 diff --git a/consolidated-00104-of-00272.safetensors b/consolidated-00104-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2971ab72244aadd10f437643efad84eec5b50a7a --- /dev/null +++ b/consolidated-00104-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0365d61482c1af67c5c0588689bfce392c8396d49829e7a1c6e3ce9703a1ecd9 +size 4991231064 diff --git a/consolidated-00105-of-00272.safetensors b/consolidated-00105-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bafda1a179bec5d838d6115eff22da74409e594c --- /dev/null +++ b/consolidated-00105-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e28d7caada24b9d0e23a7c253b4e5bdff8fab0b789ae4819d873cad67856025 +size 4991230984 diff --git a/consolidated-00106-of-00272.safetensors b/consolidated-00106-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..86438db32640f83c73dc771343295ab5bc5ebaf6 --- /dev/null +++ b/consolidated-00106-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d165496ab18532a1d00cdd86e45929cbfe867f4a771705af63d8a55294b529ea +size 4991230984 diff --git a/consolidated-00107-of-00272.safetensors b/consolidated-00107-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f95c0b7ca71fc2a6af43f0a64cb1cbcb3cbb0ed2 --- /dev/null +++ b/consolidated-00107-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb9d0ae45f59b7aa0fdd39627870a042b4b39be351b09abcb0807704cb1887f +size 4991230984 diff --git a/consolidated-00108-of-00272.safetensors b/consolidated-00108-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7afb0ebadecbbf3600aaf6b454ccbd63e635cfc6 --- /dev/null +++ b/consolidated-00108-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaedafc2f3646089e18a3fecacbc0cdfeb76ede0a43b214d68afb2d57caec435 +size 4956267896 diff --git a/consolidated-00109-of-00272.safetensors b/consolidated-00109-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e2eb64191744f5448d03b6be67037091d78301d --- /dev/null +++ b/consolidated-00109-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8879663befbff94e5f71a5561bb68cf43ac9989d7b3e4b6cc8defdd02c39623 +size 4991231040 diff --git a/consolidated-00110-of-00272.safetensors b/consolidated-00110-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3d5401ff2465d6d91a4ad534514579f13f664501 --- /dev/null +++ b/consolidated-00110-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48e5c8658b8d6f507a706caf8dbea3deb7833499bdefc54f8c9a7708c4329682 +size 4991230984 diff --git a/consolidated-00111-of-00272.safetensors b/consolidated-00111-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6247e09983fdca6c24bd7c08a813e7ef372e8c7d --- /dev/null +++ b/consolidated-00111-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e93f0a9164c4d3f8f6e087970bf717254a1765a3fc79ae8a4791c7dd7c6fd72f +size 4991230984 diff --git a/consolidated-00112-of-00272.safetensors b/consolidated-00112-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..55b3d953c23a0601aa3a3dfda40b06543815d1b3 --- /dev/null +++ b/consolidated-00112-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b28fe8f7efdf64b33eefcf7436c3b55e32316d117c0dccd60f501970c000cd9 +size 4917456320 diff --git a/consolidated-00113-of-00272.safetensors b/consolidated-00113-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..56158394af12090f1852018bd44fb610facc7c37 --- /dev/null +++ b/consolidated-00113-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a14f47505864204eaec0caa886b06f2640c9583eb3b2558505aef03e53851b +size 4971322232 diff --git a/consolidated-00114-of-00272.safetensors b/consolidated-00114-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53230c3fb4746659b4545fe30ad3839d99d23dbf --- /dev/null +++ b/consolidated-00114-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23d279be6143a3e2f7f6c757cc2ad1cd6fc2040634dc4212569099d93b03d32 +size 4991231008 diff --git a/consolidated-00115-of-00272.safetensors b/consolidated-00115-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..161b4d1996842b3fd7d00c891e3dd2c77fd86757 --- /dev/null +++ b/consolidated-00115-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af3abed770d7f0d8a000857d20ff6639f1c1609b79053b95ce8f30d9ed629927 +size 4991230984 diff --git a/consolidated-00116-of-00272.safetensors b/consolidated-00116-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a62fd070fef159792b95cae067164caabe8a5b6d --- /dev/null +++ b/consolidated-00116-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6292d73e2b17346ca3b9acbf9799215808ed4748ab19c2faf13d754d07135f51 +size 4991230984 diff --git a/consolidated-00117-of-00272.safetensors b/consolidated-00117-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..79d01c26dd643604f52d1c108185d2c588dd3392 --- /dev/null +++ b/consolidated-00117-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea075e517fa248fb0f5523a74a195db74eb697e452e35b9af44215b30722399 +size 4956267872 diff --git a/consolidated-00118-of-00272.safetensors b/consolidated-00118-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8fa6312087bf64321cef16a8ea4c8daf209c335b --- /dev/null +++ b/consolidated-00118-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:604c83d058249dd0ec9dc3c1152cfcbb39cd76e7b43e5e16138cbaf20369107d +size 4991231064 diff --git a/consolidated-00119-of-00272.safetensors b/consolidated-00119-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e4902fe6094d29313a6e0fdd950df18342e9b2a2 --- /dev/null +++ b/consolidated-00119-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44adfb9d9efb62d636b46f66fac3eae86ded4d25c2937ed3007494e5aafd4b82 +size 4991230984 diff --git a/consolidated-00120-of-00272.safetensors b/consolidated-00120-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..234e8e04785a847da7fea4de028d90d8fbc8756a --- /dev/null +++ b/consolidated-00120-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff7ecbdfff3e80de0a787682fa71d7545f48a6da0bfa396eff05c756ad3836ba +size 4991230984 diff --git a/consolidated-00121-of-00272.safetensors b/consolidated-00121-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a8fc27d956185d442867b4aeb6431e0f3d7d83d --- /dev/null +++ b/consolidated-00121-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:185e96cb99a652f6f55fba16b02c040c6ad1a8ee6cb3566d8d9a2e5cc0972166 +size 4991230984 diff --git a/consolidated-00122-of-00272.safetensors b/consolidated-00122-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b0a45d4086cbbebdeda8bdb5b7487b281f5738cf --- /dev/null +++ b/consolidated-00122-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b116bff3b259dc54503c9ebae944e2912c16c1aa8b7adaf8ec2bff0b06afdc +size 4956267904 diff --git a/consolidated-00123-of-00272.safetensors b/consolidated-00123-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8f91c5f4d7a63abb76bd23f10e91442fa177a938 --- /dev/null +++ b/consolidated-00123-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d77be941b44c1ec924fe9971ddadb1f15c0a588fdf483fd6decfb7a642cea87 +size 4991231032 diff --git a/consolidated-00124-of-00272.safetensors b/consolidated-00124-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..baf24585df0811fa1decd1ea98d03098df6b018a --- /dev/null +++ b/consolidated-00124-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac65ae853415d0777c3076526ff230350549e776cd8ca9dcd0eae9f0ab1c095b +size 4991230984 diff --git a/consolidated-00125-of-00272.safetensors b/consolidated-00125-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..447ca8e485acf5656b15dd1812166dc6cf161933 --- /dev/null +++ b/consolidated-00125-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b1dadc6b8a01441f67eaba60c66f2cb11f775c01302adfb3296cf082d095169 +size 4991230984 diff --git a/consolidated-00126-of-00272.safetensors b/consolidated-00126-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d21c1141384ababa36ebbed245ef5c6fef390ae1 --- /dev/null +++ b/consolidated-00126-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:505d3ab43a4b2973401d7d1a8aed5b27e512d716bbbcb6200bf0dfae52ce78fd +size 4956267856 diff --git a/consolidated-00127-of-00272.safetensors b/consolidated-00127-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7d6742c86814f6aaf8d2bc1febd29d87ffaec5b0 --- /dev/null +++ b/consolidated-00127-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10963128598873b13e02d937f1e89b04e2f5fac38d1feafd26dd6fb0d315820e +size 4991231064 diff --git a/consolidated-00128-of-00272.safetensors b/consolidated-00128-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..22aebd133cdef2d85f58cd4b1e22970620560776 --- /dev/null +++ b/consolidated-00128-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb9c6bcd7d562cedfb8d3b8306cf03e7df68d7711f7ab12c87acf5e4ff410dc3 +size 4991231000 diff --git a/consolidated-00129-of-00272.safetensors b/consolidated-00129-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4aad678620215ad3a7aaa6f8c886437e10906478 --- /dev/null +++ b/consolidated-00129-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b75aa0c5c8e322b03e7df78d000803b62be9e78e80371375429be71b4eba71d +size 4991230984 diff --git a/consolidated-00130-of-00272.safetensors b/consolidated-00130-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..97d98c04be8d3774d58be95877acde97b074d0c2 --- /dev/null +++ b/consolidated-00130-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e45808356ca699a51bb0e272e79bcad3b18bd77934bcd1f6612c2200db863be7 +size 4991230984 diff --git a/consolidated-00131-of-00272.safetensors b/consolidated-00131-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ea94fa448128d13e600fb21e5c2331c352193936 --- /dev/null +++ b/consolidated-00131-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f631f882474530ea5a366b5280e255e3e3ea104c6493eaf8d43dbf4dce7b90 +size 4956267880 diff --git a/consolidated-00132-of-00272.safetensors b/consolidated-00132-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..71bc1f4a0c1ec4e031ebd3259537555950515067 --- /dev/null +++ b/consolidated-00132-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3ba8956b5f6e03ef021003d9b1f2cbd0ccfacf13250ef630faa346f5980cbbb +size 4991231056 diff --git a/consolidated-00133-of-00272.safetensors b/consolidated-00133-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5235cda338d9dc259d70ebbc41f12423fc80a709 --- /dev/null +++ b/consolidated-00133-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:362bf4f64c9f14e3473b83ebe2dc66e42d16f8402c5883de4efce5c1b1120265 +size 4991230984 diff --git a/consolidated-00134-of-00272.safetensors b/consolidated-00134-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bb7f0a95fa2fb111f265725351b9450b6fdab640 --- /dev/null +++ b/consolidated-00134-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fdf8b956a6bbe2e991342614a6c43c01b99ebcb3b0280d50a80893ccf6ab593 +size 4991230984 diff --git a/consolidated-00135-of-00272.safetensors b/consolidated-00135-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..62b0e4942b7ae6579a194f6c03038753fe74f7f8 --- /dev/null +++ b/consolidated-00135-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0b716a7ee8f9b4a9383df564ad7cd8d9a3d413c51e3c970b938897fc0f985f2 +size 4991230984 diff --git a/consolidated-00136-of-00272.safetensors b/consolidated-00136-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..77e7d490cac1d2d1ff9fb256797f690e3b02901c --- /dev/null +++ b/consolidated-00136-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:519bc39baf4055ef5444d14c21a94ba342cbf254d151ae1295fb71d3cd080bc8 +size 4956267904 diff --git a/consolidated-00137-of-00272.safetensors b/consolidated-00137-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..abc62c2f84d21cb603fb0c0615a94a24be30338e --- /dev/null +++ b/consolidated-00137-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:114c67692f52414a2f9b97205be27b7cde5cc43e96a9c5c6b04c05ed4f489fba +size 4991231024 diff --git a/consolidated-00138-of-00272.safetensors b/consolidated-00138-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7095ed98fe6bef5821f9afd2959415ce5e58bad7 --- /dev/null +++ b/consolidated-00138-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a103457d4e2c0e0745c41c81be9569a1201de315068ee8ba4def14a7c506c7c4 +size 4991230984 diff --git a/consolidated-00139-of-00272.safetensors b/consolidated-00139-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aa784458235a4fc9137eef6ae5abcb2cbf37ae50 --- /dev/null +++ b/consolidated-00139-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5db679c1d7613f7ed9dd54384959399328c7ab885330eeef81011ffac2f5dd7b +size 4991230984 diff --git a/consolidated-00140-of-00272.safetensors b/consolidated-00140-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52acd81073bd6d8c63d1c3fe8d1873866208d216 --- /dev/null +++ b/consolidated-00140-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffdc470732657da906521d7cca2764b792d65ceaa403e002b5e4cc60cc7f9bab +size 4956267856 diff --git a/consolidated-00141-of-00272.safetensors b/consolidated-00141-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a46c86d87afebf4e49c5e2427350313d01002206 --- /dev/null +++ b/consolidated-00141-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:173667290837e32789a5bc38e33aba4ea6b062e9fe59feb4f73f4da07cd3cf1c +size 4991231072 diff --git a/consolidated-00142-of-00272.safetensors b/consolidated-00142-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d0c4399fcbf329fd6b2d60513ac8823e61552b7b --- /dev/null +++ b/consolidated-00142-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:278ea887337c50c5f6e48e76403663bc784dc89ab9552603dc8b14eb212f6775 +size 4991230992 diff --git a/consolidated-00143-of-00272.safetensors b/consolidated-00143-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f8282494fc58b1de974432385c8beb1e121906d9 --- /dev/null +++ b/consolidated-00143-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6d9fb4c337f3782b6b45b97b03d2adb98c55df6ea12a4c07a689cb370dc8b83 +size 4991230984 diff --git a/consolidated-00144-of-00272.safetensors b/consolidated-00144-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..efef3ff77a2345569b1ddad71d02da5a6c1f43a2 --- /dev/null +++ b/consolidated-00144-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9e176eda125a2d8dcb14ce13bd910443816c40e2ecf63472b661a91500ca64 +size 4991230984 diff --git a/consolidated-00145-of-00272.safetensors b/consolidated-00145-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dbb36a986c7b4987ea4c746042a3ff92c0ebe89a --- /dev/null +++ b/consolidated-00145-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8ef84414c4b95a0f14c3c54d75bcc5dde480a7e907bcb32a79e5bb29c7052cc +size 4956267840 diff --git a/consolidated-00146-of-00272.safetensors b/consolidated-00146-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5d529be5aa34d6c3381536340d4a19ee0af8ba3 --- /dev/null +++ b/consolidated-00146-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4d77e31357b4f3b8744781f288cc49566280546f78934e0823ba1760ae655f8 +size 4991230960 diff --git a/consolidated-00147-of-00272.safetensors b/consolidated-00147-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7fe993ba3a93771731f1e8eab4d6f21cc0beda6b --- /dev/null +++ b/consolidated-00147-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04bb36a76766e6a7495fdf35d753763463b31c80ce15473c96c53172f5ce42f2 +size 4991230904 diff --git a/consolidated-00148-of-00272.safetensors b/consolidated-00148-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9bd8a3516b7ab0d977c6a6f207c159f02cbd5682 --- /dev/null +++ b/consolidated-00148-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd7b4258bf73b92a4dbae0adde01c3f6b51fff8d5a9a8881a5002b6edac40121 +size 4991230896 diff --git a/consolidated-00149-of-00272.safetensors b/consolidated-00149-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8dc15cb230b4c8b49f6c27cd958838f996a1b6d4 --- /dev/null +++ b/consolidated-00149-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17094287409066ecbafd0633f854755286086116ef8b6bbc36602b54bbf13cff +size 4991230904 diff --git a/consolidated-00150-of-00272.safetensors b/consolidated-00150-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..81dbb4c9679603cff85eb96a54d2331f506dd8e2 --- /dev/null +++ b/consolidated-00150-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feebc9894e3b44fb4003869e1b1b53c6a16856e5bf59087886f74343abf75840 +size 4956267904 diff --git a/consolidated-00151-of-00272.safetensors b/consolidated-00151-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6236e2461b7eae1196bc03918db13b5faefb7b17 --- /dev/null +++ b/consolidated-00151-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40b9f16e7ac117dfd765b3eaec87008f7f76aa027ce3d7889705da96b34528ff +size 4991231008 diff --git a/consolidated-00152-of-00272.safetensors b/consolidated-00152-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2624642d8bfabb8cf4d62bff23dfdcd138418d8c --- /dev/null +++ b/consolidated-00152-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9986eb5a58803ff177a462cfc6c53c16b499b2faef8558331d967f367c53a1fb +size 4991230984 diff --git a/consolidated-00153-of-00272.safetensors b/consolidated-00153-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e9d84ab3983dfa9739967a6ff045bd08f7b9c491 --- /dev/null +++ b/consolidated-00153-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:907a1dc029ead781f5d4966db68090d1f251f03a40c6000944d0035347a67baa +size 4991230984 diff --git a/consolidated-00154-of-00272.safetensors b/consolidated-00154-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..71efa025cb7ef5da45a59cbe437e3a38748d3e73 --- /dev/null +++ b/consolidated-00154-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6c44f0424b702f9865da23eec518cb916ea25d618b0980f902f7a111333f5cd +size 4956267864 diff --git a/consolidated-00155-of-00272.safetensors b/consolidated-00155-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ca9f00046b2c88e2f485d22ffa3c6ee0d2a6f351 --- /dev/null +++ b/consolidated-00155-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c18ca6dad16215273d0ca179c2f54af6f82b2c63e842e0fd4c79d756f94813c +size 4991231064 diff --git a/consolidated-00156-of-00272.safetensors b/consolidated-00156-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2a683933ae718ee7b1c3d74b99a86bbd630f61a2 --- /dev/null +++ b/consolidated-00156-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2192e12025bc9c71981ab25034514c9551ea0d3705510b3329ccc75fcea0c498 +size 4991230984 diff --git a/consolidated-00157-of-00272.safetensors b/consolidated-00157-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..58dacbb9b0d01c219c3e75d0279abb72e41083f1 --- /dev/null +++ b/consolidated-00157-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:881e6e978a127d7586db0e5e55317edac508f6e4d4f2e6b3fc7c5288f5e2dded +size 4991230984 diff --git a/consolidated-00158-of-00272.safetensors b/consolidated-00158-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..52233211552ba6cd109769a9938b46d050d4faa5 --- /dev/null +++ b/consolidated-00158-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70895fdd7e7fb09619257bd3cf5f1d9be662e6bc0e88224020c8c707a1696140 +size 4991230984 diff --git a/consolidated-00159-of-00272.safetensors b/consolidated-00159-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37012ad691d14aba6b01d14bbbed56803ee8ff09 --- /dev/null +++ b/consolidated-00159-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98631ba1f6ab73019fd383444d58de7df652f93b1f1947de56a45eea9193d7c1 +size 4956267896 diff --git a/consolidated-00160-of-00272.safetensors b/consolidated-00160-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..31ce3747fb6efa0f398a747ed0c4c213915abe84 --- /dev/null +++ b/consolidated-00160-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd1176c75ac28eb1ade00b7bfb41d957163cbdb4bdb959172c2078a37e50d54c +size 4991231040 diff --git a/consolidated-00161-of-00272.safetensors b/consolidated-00161-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ff32b5235b2e4dc379682c02edf3bbf83f8591d --- /dev/null +++ b/consolidated-00161-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55691e5a83cc06d017a7be0bebca8fd671996de83ded36d97d159f5c1e1e381d +size 4991230984 diff --git a/consolidated-00162-of-00272.safetensors b/consolidated-00162-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9736f1886d03b6aa2f14ccf768dd829eb410cfe7 --- /dev/null +++ b/consolidated-00162-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b9fe2aa22533b606d56bb2937a0c96dc8b7c71ce53bd6f529dd1c705669fd98 +size 4991230984 diff --git a/consolidated-00163-of-00272.safetensors b/consolidated-00163-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8a45a195c4a699e8c2bd1f1c1aee4f155ae76d51 --- /dev/null +++ b/consolidated-00163-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb2a3b8475cd2d613ec876c42ae89473b4896e888bbba447c24755e822f7053b +size 4917456320 diff --git a/consolidated-00164-of-00272.safetensors b/consolidated-00164-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dfe2d4c58dce18b623e2f8162aeb08ecdcfb769f --- /dev/null +++ b/consolidated-00164-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:477cde66908de77c6262ab320029159f922a80d780b01a372d7e9f4d1bb1ab17 +size 4971322232 diff --git a/consolidated-00165-of-00272.safetensors b/consolidated-00165-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f4af1da25d01ff311a8bf28e4b3dfd0a27d7f62e --- /dev/null +++ b/consolidated-00165-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60b4bf5039be0c29b726b7469c1e728c46280612a29992f0cb2a48000bae643a +size 4991231008 diff --git a/consolidated-00166-of-00272.safetensors b/consolidated-00166-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a7fec40c1c2ff97f719ccc1adce616faa18bbfb0 --- /dev/null +++ b/consolidated-00166-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80ff7229db681007479d382203b78783ecbfd6d97af1cfaacce30dd5ae186d39 +size 4991230984 diff --git a/consolidated-00167-of-00272.safetensors b/consolidated-00167-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c85130cf5e77f0195aa98b61ca434c2f29fc7c50 --- /dev/null +++ b/consolidated-00167-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67807b3b0795fedfbb20896590030c4d12e5facf4759dfedaaed470ecfdc61a5 +size 4991230984 diff --git a/consolidated-00168-of-00272.safetensors b/consolidated-00168-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b39a19814cc30c111fccf3fa8fbd68e913a91480 --- /dev/null +++ b/consolidated-00168-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbab1727fc9f87affb8c4b8c1de6e849fa3438914d91bf3afc5203d8c13e93bd +size 4956267872 diff --git a/consolidated-00169-of-00272.safetensors b/consolidated-00169-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc3753b2cb9b3670af47f0acf7b2eba75022c146 --- /dev/null +++ b/consolidated-00169-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25f764bfde1d4ccb42ac1ca428ea01b3471d72a2879cccfa4c74ed11271dce1 +size 4991231064 diff --git a/consolidated-00170-of-00272.safetensors b/consolidated-00170-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2af73f1f262619ae9ed17ac01ea9a3a3d5298f0 --- /dev/null +++ b/consolidated-00170-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a161d6a767a2472cf5b6c59db488abc57f0fea139a54c18401c347f95d59b4e4 +size 4991230984 diff --git a/consolidated-00171-of-00272.safetensors b/consolidated-00171-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0ca9096a9c3d88eae664f913b9f025c6e23c4e29 --- /dev/null +++ b/consolidated-00171-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca312aa542425893b8c4e6a70136b34c998b6b2686381e37b2da3a5f43ef3edc +size 4991230984 diff --git a/consolidated-00172-of-00272.safetensors b/consolidated-00172-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..376e76afbf791b56d372198dd4efb9b3a3931a85 --- /dev/null +++ b/consolidated-00172-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:922ddc0e8c2f3f8a88051a411ee1c249aa7e6298a34d8a710a787b1653626cfb +size 4991230984 diff --git a/consolidated-00173-of-00272.safetensors b/consolidated-00173-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5eb33c0e023734774da00ef2924cb6ba1fe1bf9b --- /dev/null +++ b/consolidated-00173-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:591438c6ba127e4bc49d7e7e0bffe67f8f22dfe734f9d1cd673c2dd825ed7f48 +size 4956267904 diff --git a/consolidated-00174-of-00272.safetensors b/consolidated-00174-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3a764fc5919988b1cdefec5073251a5048590c12 --- /dev/null +++ b/consolidated-00174-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88537d959e84230825d50517210820050aafaf17ccde22c53524088196554809 +size 4991231032 diff --git a/consolidated-00175-of-00272.safetensors b/consolidated-00175-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9368c8f29ae23ef0b29139ee4c4902d05844515e --- /dev/null +++ b/consolidated-00175-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25b2e1e6521105e367dfd9a775f0b156f951dbefca08712338a8124f4978dc9e +size 4991230984 diff --git a/consolidated-00176-of-00272.safetensors b/consolidated-00176-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cd232885eb01c7ac2c6a81e20c5c3cec62e9691e --- /dev/null +++ b/consolidated-00176-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7308fdf1fa66d7361d0866be3c890151a32262381c351a858607cadd76f9141 +size 4991230984 diff --git a/consolidated-00177-of-00272.safetensors b/consolidated-00177-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6a305e4035965bfc92aabdd2ffbfe52ebc5f467c --- /dev/null +++ b/consolidated-00177-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee61682602969f559fce680f23e16ca90d0d7b1fe8ce9075317368596b818266 +size 4956267856 diff --git a/consolidated-00178-of-00272.safetensors b/consolidated-00178-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f10e5c359e3bcd55de04630d07e8ab3a67a1484a --- /dev/null +++ b/consolidated-00178-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ae70805eb13dbb8c6bee723df28f22ed15560dd292a7f0d8d9151a650a8b69 +size 4991231064 diff --git a/consolidated-00179-of-00272.safetensors b/consolidated-00179-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..358658fece05053304d1d33c30bacc954ef31f79 --- /dev/null +++ b/consolidated-00179-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebfa4a2052fdfda86d70f4b3341d6e9d840f14737c2fcdeca5c0625cb525f60f +size 4991231000 diff --git a/consolidated-00180-of-00272.safetensors b/consolidated-00180-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6aa0767a09ddad108a5126a5ae547fd8ddd94cea --- /dev/null +++ b/consolidated-00180-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12321f88620b781fd03a01852f0a8b67fd9e7b63f60df3a145129c958b3ca377 +size 4991230984 diff --git a/consolidated-00181-of-00272.safetensors b/consolidated-00181-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..83de351cfcf0012bf1dc5a653ebd82ee792a8a96 --- /dev/null +++ b/consolidated-00181-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526f602308dca2cf6847a7cb34af26715a67e41ad6e334ce4b5aa0f13d70fb2a +size 4991230984 diff --git a/consolidated-00182-of-00272.safetensors b/consolidated-00182-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0355370fae7957dabe6c1444ded526fa441d9eaa --- /dev/null +++ b/consolidated-00182-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429e67260f74ddfb9892ca077724fb7ac0bb49fae518fd091f38a20e28e04f9c +size 4956267880 diff --git a/consolidated-00183-of-00272.safetensors b/consolidated-00183-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d47c1d408114a8085625a8c45d2d595a59403650 --- /dev/null +++ b/consolidated-00183-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03191cf4d052d9e25ff251bbfdbe7eb1585c857f5eb60501e13eddde8b54f6ea +size 4991231056 diff --git a/consolidated-00184-of-00272.safetensors b/consolidated-00184-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..22286206db87b4c0f6b71011cfbe4524b4c9285a --- /dev/null +++ b/consolidated-00184-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e019524d0be0f72346f70e5a9f6465b2d2e6140e72fb9bad7a67c65ba8821e96 +size 4991230984 diff --git a/consolidated-00185-of-00272.safetensors b/consolidated-00185-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fd4d8a04475d130afcb1dfa2e8307093071f3d29 --- /dev/null +++ b/consolidated-00185-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0555e3f6ad3896a5d2580f06b05a1f3d3ce03e11d0aa3c1f5f0864a84bae72df +size 4991230984 diff --git a/consolidated-00186-of-00272.safetensors b/consolidated-00186-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b9b3d5c9afff28cec9470e009b8ffcf6882950a9 --- /dev/null +++ b/consolidated-00186-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8995176f92a5961247d7d349ad616d860c30ae2057979250e7b3c8dd1f79e6 +size 4991230984 diff --git a/consolidated-00187-of-00272.safetensors b/consolidated-00187-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d7f99d7467573f3da5946f2b136bcdac31f39a24 --- /dev/null +++ b/consolidated-00187-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068c1aa3c716f40917766a576023d61d78376bf61ce3a5e4e685a4a55bce67cc +size 4956267904 diff --git a/consolidated-00188-of-00272.safetensors b/consolidated-00188-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0c3dd579fec318e6a1d1a7323318e7fda1044d5 --- /dev/null +++ b/consolidated-00188-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376ce368cc05488959de033f28527264fdde0acd63b931d3c74bf57c7cf4a073 +size 4991231024 diff --git a/consolidated-00189-of-00272.safetensors b/consolidated-00189-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09e6a4adf78802ce40ce5dc059472db005792be8 --- /dev/null +++ b/consolidated-00189-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfbe8000c1d9e692de2d58737f57d6c92c6e2603f17be27bf5bb9c04f63963e0 +size 4991230984 diff --git a/consolidated-00190-of-00272.safetensors b/consolidated-00190-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8e77cfcea59398106dc0bdbca54f975ca0e4bd90 --- /dev/null +++ b/consolidated-00190-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:759537d4a3a85f6b6c3fcf25189e1389bb1d02e7b289f7f3396ab6d1c6bdcfd5 +size 4991230984 diff --git a/consolidated-00191-of-00272.safetensors b/consolidated-00191-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5d8bba6197d98709c58d74ca2ad5157e849614b --- /dev/null +++ b/consolidated-00191-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121a6150f2baf183731595ff4221b333c9ed041c4b7c3ec5ab8cfc601e225516 +size 4956267856 diff --git a/consolidated-00192-of-00272.safetensors b/consolidated-00192-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cf816d6c36b6f76d77a693232626f4ff8868dfec --- /dev/null +++ b/consolidated-00192-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a64c7641b2562f6c60d715dd05bbe4c9ff33d8501e89f9da8d2bee55be8ee6 +size 4991231072 diff --git a/consolidated-00193-of-00272.safetensors b/consolidated-00193-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7f8676470946670d2f9268031d3f6fed745e8e73 --- /dev/null +++ b/consolidated-00193-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257bee961c14ba89066e1de666f2b8842b72dfc86a29c80500171216692702c4 +size 4991230992 diff --git a/consolidated-00194-of-00272.safetensors b/consolidated-00194-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b0f20013d31918c82b5702c31a89d5f5ebc72fda --- /dev/null +++ b/consolidated-00194-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:897a21fc9402cb000a6b4453b63631fa84431a320a01d5a9a4b2935f1ed7f8a9 +size 4991230984 diff --git a/consolidated-00195-of-00272.safetensors b/consolidated-00195-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5182b9b2523bfd7ee156cc32e335b0f5e98ff6a4 --- /dev/null +++ b/consolidated-00195-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e402c64da74bcfd1d9224f75a85e0b4d686492b93644e691d9e3d7a24fa5fb0e +size 4991230984 diff --git a/consolidated-00196-of-00272.safetensors b/consolidated-00196-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4203050e0fb4fde10dbeef4c436bfbe87c2323bf --- /dev/null +++ b/consolidated-00196-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:842c6f53d6d4fc9839fcf14a792ba9c671f48a0e54a6bcfea3f8900552239f9f +size 4956267840 diff --git a/consolidated-00197-of-00272.safetensors b/consolidated-00197-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..be06643a88451d910f14ed057ea898df4c187ba5 --- /dev/null +++ b/consolidated-00197-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1756c04ee70068c0d094c40340e2c4c28705c4fc2c464d0bb066f78263ee027 +size 4991230960 diff --git a/consolidated-00198-of-00272.safetensors b/consolidated-00198-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6fc7dce94f6101af9a22d5677423b97870ce950d --- /dev/null +++ b/consolidated-00198-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:547596fc27e930dd4d906bac6886b02780a23392ae391924fd0b2f1f2412a221 +size 4991230904 diff --git a/consolidated-00199-of-00272.safetensors b/consolidated-00199-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37e072761f4dfaefaaf00145462915b47166241a --- /dev/null +++ b/consolidated-00199-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1513fb2aeacdec6bcbbe22eac9252c1e2816b352d6d955f245625bdb21663b +size 4991230896 diff --git a/consolidated-00200-of-00272.safetensors b/consolidated-00200-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..78be403c5b752b98f2230e51a5c6fe876e19555c --- /dev/null +++ b/consolidated-00200-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63b5fc6edd2387ed5462289f090ef8dd7ccc24ea21398355e6804713b65456d9 +size 4991230904 diff --git a/consolidated-00201-of-00272.safetensors b/consolidated-00201-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..70878ab9f540e21f5681fc2f2a0aeec774dac9d3 --- /dev/null +++ b/consolidated-00201-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e9d4d5ff3d019f6e655e3181ca09917293e8bf57d4f6f051f63fdbbd8921a02 +size 4956267904 diff --git a/consolidated-00202-of-00272.safetensors b/consolidated-00202-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b27e4a363348c17d74386691b9f49991623b3511 --- /dev/null +++ b/consolidated-00202-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac651d848dba43dff9c61421af0db9f2f25c6a317b1b7e305e36421fd3ee5a7 +size 4991231008 diff --git a/consolidated-00203-of-00272.safetensors b/consolidated-00203-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c55344bdb80709f3fa6281d4dbce6b9bb88618d8 --- /dev/null +++ b/consolidated-00203-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a69e407b154db0a5ce922e742b2ddcbb94cf5b10312350d15790641a6640598 +size 4991230984 diff --git a/consolidated-00204-of-00272.safetensors b/consolidated-00204-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d46a0488a5a473a0057ff95d49e3c03464aa87fd --- /dev/null +++ b/consolidated-00204-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23375729e2b97fff2986b3a5bf3247b43a305c3a67098a6234afb0412e89e72e +size 4991230984 diff --git a/consolidated-00205-of-00272.safetensors b/consolidated-00205-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2315cdd769edc9c97e58fa6c924ccb6cbd622ef7 --- /dev/null +++ b/consolidated-00205-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b686c8197d06ea17e4c7dfaaa8d77c718a356b0c7e6cb6a7326b95d08fedbb31 +size 4956267864 diff --git a/consolidated-00206-of-00272.safetensors b/consolidated-00206-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3f8bcc222c9aae6404a804f1f6664fd742cfaea8 --- /dev/null +++ b/consolidated-00206-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03375e8009eb4e183031d065baa07e83b8308ee812582e72804955b937d520c5 +size 4991231064 diff --git a/consolidated-00207-of-00272.safetensors b/consolidated-00207-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5950916d73d8fd1d180cd27b33c82ecc262457e6 --- /dev/null +++ b/consolidated-00207-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac47327e31021ab044ba216093b0ea4d8b3af918647f94a1f1c92df0d746fc19 +size 4991230984 diff --git a/consolidated-00208-of-00272.safetensors b/consolidated-00208-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7158e9856752b65a82b8ec50d3804c1b9aa8fa4b --- /dev/null +++ b/consolidated-00208-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db93b147a766254f108fffe916a7b204323c56c0faf2fa5f8491a6e12981adaa +size 4991230984 diff --git a/consolidated-00209-of-00272.safetensors b/consolidated-00209-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c4ddc2ebd16124a713807b8b8229b757f0b142b5 --- /dev/null +++ b/consolidated-00209-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068b3657b951c83d907e20552874c2b88044bcb2178b108527f0610d16df5931 +size 4991230984 diff --git a/consolidated-00210-of-00272.safetensors b/consolidated-00210-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..951752a59368eb26eb99f87c8ca90911bc4f7679 --- /dev/null +++ b/consolidated-00210-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a2a221fd5e5b2ee17d6dd1f8eebc21462d3a038e259482ae1731602405dfea +size 4956267896 diff --git a/consolidated-00211-of-00272.safetensors b/consolidated-00211-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0b5c82f8bd1adaa4e3c555c50687fef63684cf39 --- /dev/null +++ b/consolidated-00211-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad29ab18633a3371f7b89c87082356cc9d1592dae87c446b55356d7de44a28f1 +size 4991231040 diff --git a/consolidated-00212-of-00272.safetensors b/consolidated-00212-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..815a38b5dbf954ee25a669c749a62fbab5846083 --- /dev/null +++ b/consolidated-00212-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5005e06f0ea0d401b96efd359e8448ea38321f0cdb5c215c50b937fa0b73640e +size 4991230984 diff --git a/consolidated-00213-of-00272.safetensors b/consolidated-00213-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..10b85622cc83be196ead4caf90f20c671777fb56 --- /dev/null +++ b/consolidated-00213-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc4e91ef4f54894b1c83234b64794b7d4049129aacc01e4f1b7f89e68e7b71b5 +size 4991230984 diff --git a/consolidated-00214-of-00272.safetensors b/consolidated-00214-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e542157bac2cb9f85198b9b8f4be201687d9b4b --- /dev/null +++ b/consolidated-00214-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e28dd2ddb63c77effc205430196aea7eed68f4f2997fb3c22ba2076448c59f1f +size 4917456320 diff --git a/consolidated-00215-of-00272.safetensors b/consolidated-00215-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1aae15a3c9f5175b16562088fdc4aa9da54b63ac --- /dev/null +++ b/consolidated-00215-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18b53d3b20bd64a6b656d4d7a58b14e231476341f25e67a400c385a68d1cf235 +size 4971322232 diff --git a/consolidated-00216-of-00272.safetensors b/consolidated-00216-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d210fce6036cd8212c0bbfdc86a2f37491716b4b --- /dev/null +++ b/consolidated-00216-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad409e0c7100512a33fe7858ce1bad6ac4d17c26196f6befffcf356971c54ad +size 4991231008 diff --git a/consolidated-00217-of-00272.safetensors b/consolidated-00217-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f05c406c7bc00735d5a89ccd1bcf3b2639c8165 --- /dev/null +++ b/consolidated-00217-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:363800645ac444aeea0f8e149a1ff0d06f5366fcc1ce78d9a413dbebbd7138e4 +size 4991230984 diff --git a/consolidated-00218-of-00272.safetensors b/consolidated-00218-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..70b242dbc17c594c0a966a1277b29774f8ac69e9 --- /dev/null +++ b/consolidated-00218-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09bc4a00746de27bd32bb87b101411a009b7ca8752b5118d40d4cf6b928ecc3f +size 4991230984 diff --git a/consolidated-00219-of-00272.safetensors b/consolidated-00219-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f97356d302c9543f4dbd360d9ef92b4f3e1f6fa --- /dev/null +++ b/consolidated-00219-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a03db350518045ac7aece71232555c80ff85388b21087ab68bfd458ebfcb87d +size 4956267872 diff --git a/consolidated-00220-of-00272.safetensors b/consolidated-00220-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..08f58c18001b90ab8a3adc7fa17b938e501abdba --- /dev/null +++ b/consolidated-00220-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fede185286f23b481599df7b4cd8112af622c33e768305fbfbaefa815bdc4175 +size 4991231064 diff --git a/consolidated-00221-of-00272.safetensors b/consolidated-00221-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0c1541e1b2a970ab81d399f20bd1b0a42af98e70 --- /dev/null +++ b/consolidated-00221-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af4a434568e81275ffe8a3fad216066cfe4900300c7e78dd114db64e167de02a +size 4991230984 diff --git a/consolidated-00222-of-00272.safetensors b/consolidated-00222-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f9e172313143a317d9d60949e7547b7d009f884d --- /dev/null +++ b/consolidated-00222-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8a1b8039374edf86ad3f631574d894aad94f4d7b4f68e530c0695598dd1fe1 +size 4991230984 diff --git a/consolidated-00223-of-00272.safetensors b/consolidated-00223-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..057c45f3103d4ff7da167da3caccad8b37487c06 --- /dev/null +++ b/consolidated-00223-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caba6a240b4c5df2d965ee3948663d7f13b0e17b06cb87e90b35894eedca0c6a +size 4991230984 diff --git a/consolidated-00224-of-00272.safetensors b/consolidated-00224-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..764c9da68acfe5d8b10f6521a703c67f2bb0c108 --- /dev/null +++ b/consolidated-00224-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bfce8e10c23d6625c1cf01fb0f329f03b27e147060aa9740e9252470ce025e1 +size 4956267904 diff --git a/consolidated-00225-of-00272.safetensors b/consolidated-00225-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5ea7e7d8c80f56c65dd224a33692cdf9b0580dc --- /dev/null +++ b/consolidated-00225-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c208a76afad8859bb7a9013e653e30f63feb8eb346a742aad40926c03bc2394d +size 4991231032 diff --git a/consolidated-00226-of-00272.safetensors b/consolidated-00226-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0dedb35b62877142b0197efa438abd1e397a3ad5 --- /dev/null +++ b/consolidated-00226-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f58985a0374e124f8bb5908394c6f9764182c2649354ca702708b1b3842c0fd +size 4991230984 diff --git a/consolidated-00227-of-00272.safetensors b/consolidated-00227-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a4a9c7165628d7c380a2a6a87eac1b84e2d1b360 --- /dev/null +++ b/consolidated-00227-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fceb0ebec798e8b8b641b03b8a3840e52e4e9c38211edc05209cb86c57b96109 +size 4991230984 diff --git a/consolidated-00228-of-00272.safetensors b/consolidated-00228-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2ac640dc4608063d2ea6ba0db62914f2b6df795f --- /dev/null +++ b/consolidated-00228-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73d06aabb4a529ba8c37e3beb9be68fc41378c07df3016515a955710cbce7367 +size 4956267856 diff --git a/consolidated-00229-of-00272.safetensors b/consolidated-00229-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e44c84d296e2debdf9bdcb898a9161f882e6f4e4 --- /dev/null +++ b/consolidated-00229-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fd6bc8286e4c862c33ecdb2ca888eeef3ce6e495dbfaf99b31111e6debeb640 +size 4991231064 diff --git a/consolidated-00230-of-00272.safetensors b/consolidated-00230-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23b94e9d4a8ed831276dd8a323c4d0178c2f390c --- /dev/null +++ b/consolidated-00230-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c65fa71f3fcac3bf8fb55205a0cb5827dd3c17cf15374ff022bbe058a75184 +size 4991231000 diff --git a/consolidated-00231-of-00272.safetensors b/consolidated-00231-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1a8dbeb0a9c6496bf1b6cc3ac010752ce66d387 --- /dev/null +++ b/consolidated-00231-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd053eb66fa028f5745c46e1c5207253412068ac6cf2d8bcbb7951089d7ed514 +size 4991230984 diff --git a/consolidated-00232-of-00272.safetensors b/consolidated-00232-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d1219d77160311ae4df9b9714f7e09629062d6fb --- /dev/null +++ b/consolidated-00232-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df93b6793ff7ef5266574fa08643ade1f9a270d031d66eb70823754ef6dda3a9 +size 4991230984 diff --git a/consolidated-00233-of-00272.safetensors b/consolidated-00233-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6a57220bb681ea83a3217d75908225a5519499db --- /dev/null +++ b/consolidated-00233-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6864d6eff8d27d4a3e3a0875738f01f96dbb0736092fd01d5362ea65eb67e46 +size 4956267880 diff --git a/consolidated-00234-of-00272.safetensors b/consolidated-00234-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..81695bc87e545536c7aaee0714eaedcda0ffa08c --- /dev/null +++ b/consolidated-00234-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b07085ae8cbe14dd981e4047ec1ba401db4920a52d7691b43ea08c830dd3183 +size 4991231056 diff --git a/consolidated-00235-of-00272.safetensors b/consolidated-00235-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d2019bd19a499c34955f5f1c430827d873a4932 --- /dev/null +++ b/consolidated-00235-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fe1ba1233bb3cee7f73e2c952e2f4ca688434fefe297d7e53542d4e17827e7e +size 4991230984 diff --git a/consolidated-00236-of-00272.safetensors b/consolidated-00236-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c686cd197a691a6efd641f77f432f9199abe97bb --- /dev/null +++ b/consolidated-00236-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f941a76685be7a9a73421b1765948fafa5997f0f3e9d4aa1f2eee459a060fb3 +size 4991230984 diff --git a/consolidated-00237-of-00272.safetensors b/consolidated-00237-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..29a8afd5aa6b0a0f15e25a882c99a6ec53352c45 --- /dev/null +++ b/consolidated-00237-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef53d9fb3acd52b9bac02d2ceffec84cef5c73a23f0f3d5d4c6843d20e2e7b7 +size 4991230984 diff --git a/consolidated-00238-of-00272.safetensors b/consolidated-00238-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6e1d542c41a77042faceba7bcc4c00974619c6e --- /dev/null +++ b/consolidated-00238-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c034f9dd1950f367a19dd80e89911df9536a11893f2330672e31df1be227395 +size 4956267904 diff --git a/consolidated-00239-of-00272.safetensors b/consolidated-00239-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f666fdb4eaf88c002f3cab993b0a22f591ffbd83 --- /dev/null +++ b/consolidated-00239-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a365b031e91a6ca32aebdf78854e93a592f5167ab3f2af191ac746302c9582a1 +size 4991231024 diff --git a/consolidated-00240-of-00272.safetensors b/consolidated-00240-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f7e359f3ce71a1b9688fc426dd1e9a24e9e1d568 --- /dev/null +++ b/consolidated-00240-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11edf29d1209d362fbe9001f04e12f3223cb7c7193409421e77d9cc9788d14a1 +size 4991230984 diff --git a/consolidated-00241-of-00272.safetensors b/consolidated-00241-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6e3a8071fe0b0379453c58b3fd63e9a860b0acab --- /dev/null +++ b/consolidated-00241-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b177ddef9e0dae0094401df4ba02f72028f50a225d9682d6e605c2b6a0bd59ca +size 4991230984 diff --git a/consolidated-00242-of-00272.safetensors b/consolidated-00242-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9dfadec9f096ccf1f79ce5e11cd2cf29761e300 --- /dev/null +++ b/consolidated-00242-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09bec986251b80e3a058701046a480403e554e021c12dd44d8efea72c1137a1d +size 4956267856 diff --git a/consolidated-00243-of-00272.safetensors b/consolidated-00243-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..39335985a65387659c25c39d3c801626bba061cc --- /dev/null +++ b/consolidated-00243-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eacd4282509a03adf4c1abf4c8d5014a3bfed2fc3adb5677f4dd2e1b77195a21 +size 4991231072 diff --git a/consolidated-00244-of-00272.safetensors b/consolidated-00244-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d24fd4c95bed8c77cd1824f190f69fcf70e34b3b --- /dev/null +++ b/consolidated-00244-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21b458309df60d42a637842f79bcb614ce830e0163e67305e7e6991384d3d48 +size 4991230992 diff --git a/consolidated-00245-of-00272.safetensors b/consolidated-00245-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6841acc84fd787dfc56a9dbe2472881b7fc3be8a --- /dev/null +++ b/consolidated-00245-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c4f6981e5b8e3f6c30af4906b196a950bdfd38dddf304f51ea5120c2e84fe9 +size 4991230984 diff --git a/consolidated-00246-of-00272.safetensors b/consolidated-00246-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2b8b6c28b0caa8c9ea6db498a6d03fea9e007b7 --- /dev/null +++ b/consolidated-00246-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0108aadb1ff97733214baef22cfeaaba693f648f8e7cc07f6f471503c650a2fa +size 4991230984 diff --git a/consolidated-00247-of-00272.safetensors b/consolidated-00247-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..887bdf117ad996eba482dd76c3e93183634f1022 --- /dev/null +++ b/consolidated-00247-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d715289816adf66af7b4b6d3b959e6f3bcde3ed9cd5e74e4c09a392d0ebc95ab +size 4956267840 diff --git a/consolidated-00248-of-00272.safetensors b/consolidated-00248-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f336232a0df4fe1536e232254f32772a6b13c0a8 --- /dev/null +++ b/consolidated-00248-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3013ff2ac1d9fc964d1f891a90f9a3df84d6d938b064c91d84c11bed52a84afc +size 4991230960 diff --git a/consolidated-00249-of-00272.safetensors b/consolidated-00249-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9f7637a5c62760cfa86aeeff3d58eb2305e881a --- /dev/null +++ b/consolidated-00249-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c10b66848b5c65f260f34ff0612d9efb262c11f2190a00cc5541f1ca07f6affc +size 4991230904 diff --git a/consolidated-00250-of-00272.safetensors b/consolidated-00250-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2866302e917a446ae11df0fd30a62f224a6c3665 --- /dev/null +++ b/consolidated-00250-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe81f13005730dab2afef288d927fda82e37277d4ca52aa9b1c2f7361edb40ec +size 4991230896 diff --git a/consolidated-00251-of-00272.safetensors b/consolidated-00251-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..931cdf625dc33fc66d2a7bd53633642c5a599e4e --- /dev/null +++ b/consolidated-00251-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62272c2147b185eabebbd7daa7e11b43343a2f68756fd63269f01d4798f723d6 +size 4991230904 diff --git a/consolidated-00252-of-00272.safetensors b/consolidated-00252-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9decc4b53967ea75907e97356aadd546f385e01c --- /dev/null +++ b/consolidated-00252-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac9bb89775a22e762ccbd02ae5aaf3005c1cef5f7a579a252f612fe1fffc540 +size 4956267904 diff --git a/consolidated-00253-of-00272.safetensors b/consolidated-00253-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..299d578f1b993d9703454cbfc857e86729089857 --- /dev/null +++ b/consolidated-00253-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efb691055ac12411466c9e37afee2e40ae0b858c0601265a28cdcd67f0ab7e65 +size 4991231008 diff --git a/consolidated-00254-of-00272.safetensors b/consolidated-00254-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..34e3e937b9d7a6240490855cf80130f57b716824 --- /dev/null +++ b/consolidated-00254-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7942483b2255c93d49d4588985db81f412956f7d52944fc6594cc8ecf4ab33ae +size 4991230984 diff --git a/consolidated-00255-of-00272.safetensors b/consolidated-00255-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1d9f0415d4b4cd19d79b6c18b339071e4bbd9e26 --- /dev/null +++ b/consolidated-00255-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73164f7e4d4b72585b7f34a5004c9009d59bca512513ea6532c36ed13e615414 +size 4991230984 diff --git a/consolidated-00256-of-00272.safetensors b/consolidated-00256-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6ef5b068c140b4d20b0a256a4beb73be254734cc --- /dev/null +++ b/consolidated-00256-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:352d19030ec728a06bcbca6c5e4c9f6f53bd98a5dec961575bff0150bb1570c1 +size 4956267840 diff --git a/consolidated-00257-of-00272.safetensors b/consolidated-00257-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a085201876686619506b50a256a5f82c574a8faa --- /dev/null +++ b/consolidated-00257-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:903937519c1c575c38310156ed460113edd4f91f25913f630be6da4907a1a1be +size 4991230984 diff --git a/consolidated-00258-of-00272.safetensors b/consolidated-00258-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..764f7a2a6348fa394db7c82b65574ac371de1a35 --- /dev/null +++ b/consolidated-00258-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cf4de262d5f7e7dc5bfc2a979d03d6eea85a8a3bd853175e40b742fe6fda819 +size 4991230896 diff --git a/consolidated-00259-of-00272.safetensors b/consolidated-00259-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5354999b8f91f66c247bbbbaa1bfef17cd94330c --- /dev/null +++ b/consolidated-00259-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f33a568a442ec1e8c09ce42649dbb57777bf12f7fa0c9789f6aba9fa98cdae6 +size 4991230904 diff --git a/consolidated-00260-of-00272.safetensors b/consolidated-00260-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a2dcb1b4c50e047160f0da58c5a94dfd8a1a0440 --- /dev/null +++ b/consolidated-00260-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:154c178487df78fdd6fe5c3d4ef4a1bd32f3d19a8cf62d5348162a78cef6026e +size 4991230896 diff --git a/consolidated-00261-of-00272.safetensors b/consolidated-00261-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..989ad7a6a764102cec677b8e0b732d44fb7d200a --- /dev/null +++ b/consolidated-00261-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651e25f7e345d57482ef95044458790e9cfb9272987efb594f8391618fb20f2e +size 4956267808 diff --git a/consolidated-00262-of-00272.safetensors b/consolidated-00262-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3599e47b8766cf952b549356b11dd557583ee314 --- /dev/null +++ b/consolidated-00262-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7905013aa1e4b773563dee8db1476ba732fac62a908d3cc0477c5971e7654c27 +size 4991230952 diff --git a/consolidated-00263-of-00272.safetensors b/consolidated-00263-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bd727ebe8db46074524a3b327bcd25b17a82bb67 --- /dev/null +++ b/consolidated-00263-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34aa008596d5d36b0c51a7c1c5efb0f14afff5af5c9ff473d76ca095a779094 +size 4991230904 diff --git a/consolidated-00264-of-00272.safetensors b/consolidated-00264-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e77803869941d4de1243e80fa0d4a4576076ac14 --- /dev/null +++ b/consolidated-00264-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3fb3803f98a305a2c162993446a9be82054c50ac0004a86878a37431f5f67d3 +size 4991230896 diff --git a/consolidated-00265-of-00272.safetensors b/consolidated-00265-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b8ab90eca118360c077dc50460590bc0c07d826c --- /dev/null +++ b/consolidated-00265-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1e2081c0c986e68ab1970e8b24e07284708eced1bb7891c553a270e11e939c +size 4917456232 diff --git a/consolidated-00266-of-00272.safetensors b/consolidated-00266-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1e4ecc35bec74279a30da579c6cf6d62b3273ed3 --- /dev/null +++ b/consolidated-00266-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c0d500a878bcda7d1283f1db5fb59bd77ea5c7f209f496c14001cf876b6d129 +size 4971322144 diff --git a/consolidated-00267-of-00272.safetensors b/consolidated-00267-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f69c3bd18850c001abcc47e182b612bca3d1d26e --- /dev/null +++ b/consolidated-00267-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85af2107f1b4069df59049293ca2bc8fff2312258272d67fa4e3c6aa92c03619 +size 4991230920 diff --git a/consolidated-00268-of-00272.safetensors b/consolidated-00268-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b052197c429dc60764cb6e2fbee3f551b713e8c7 --- /dev/null +++ b/consolidated-00268-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5595ab63dbe3ad55ee3bc16cd92d3786e54f81fb67b489beb81f1aaf3948f66 +size 4991230904 diff --git a/consolidated-00269-of-00272.safetensors b/consolidated-00269-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0e23cf07b9930b2265ab1399c285e203398f0645 --- /dev/null +++ b/consolidated-00269-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e0631205ce6d97392620e5ede07733ce690065b14242e21f94f39c00bedc023 +size 4991230896 diff --git a/consolidated-00270-of-00272.safetensors b/consolidated-00270-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c8a4c5b606223e3571b210ef0c1f459287edf18d --- /dev/null +++ b/consolidated-00270-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b81d675fe3cb9e5a3c2ac2e6dd3a158db7603e5433d111f3cdcbc8ed4cd303a +size 3136183520 diff --git a/consolidated-00271-of-00272.safetensors b/consolidated-00271-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0a0fa67550e40eb792022ef4f89a71a9db6fefb3 --- /dev/null +++ b/consolidated-00271-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf75706c5dd3cbd1ae9b69ffdc749e1eac787ad611cfe69af44e4679076f7176 +size 4999447592 diff --git a/consolidated-00272-of-00272.safetensors b/consolidated-00272-of-00272.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7b8e7645aa1d3a5b5c584112b75af705b25a9bd9 --- /dev/null +++ b/consolidated-00272-of-00272.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf2a2bbaf9f8b756b1879b0c12ebcfda9d8057d675603dd379053d2053d34be +size 3876741776 diff --git a/consolidated.safetensors.index.json b/consolidated.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..9dd8a56556ab5a67ee896dcdfaecb4738552b622 --- /dev/null +++ b/consolidated.safetensors.index.json @@ -0,0 +1,23510 @@ +{ + "metadata": { + "total_size": 1351982353920 + }, + "weight_map": { + "layers.0.attention.kv_a_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.attention.q_a_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.attention.wkv_a_with_mqa.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.attention.wkv_b.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.attention.wo.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.attention.wq_a.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.attention.wq_b.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.attention_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.feed_forward.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.feed_forward.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.feed_forward.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.0.ffn_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.attention.kv_a_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.attention.q_a_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.attention.wkv_a_with_mqa.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.attention.wkv_b.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.attention.wo.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.attention.wq_a.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.attention.wq_b.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.attention_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.feed_forward.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.feed_forward.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.feed_forward.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.1.ffn_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.attention.kv_a_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.attention.q_a_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.attention.wkv_a_with_mqa.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.attention.wkv_b.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.attention.wo.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.attention.wq_a.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.attention.wq_b.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.attention_norm.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.0.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.0.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.0.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.1.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.1.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.1.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.10.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.10.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.10.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.100.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.100.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.100.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.101.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.101.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.101.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.102.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.102.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.102.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.103.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.103.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.103.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.104.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.104.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.104.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.105.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.105.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.105.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.106.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.106.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.106.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.107.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.107.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.107.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.108.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.108.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.108.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.109.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.109.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.109.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.11.w1.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.11.w2.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.11.w3.weight": "consolidated-00001-of-00272.safetensors", + "layers.10.experts.110.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.110.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.110.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.111.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.111.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.111.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.112.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.112.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.112.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.113.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.113.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.113.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.114.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.114.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.114.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.115.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.115.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.115.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.116.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.116.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.116.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.117.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.117.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.117.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.118.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.118.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.118.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.119.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.119.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.119.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.12.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.12.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.12.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.120.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.120.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.120.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.121.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.121.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.121.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.122.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.122.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.122.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.123.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.123.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.123.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.124.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.124.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.124.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.125.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.125.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.125.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.126.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.126.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.126.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.127.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.127.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.127.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.13.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.13.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.13.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.14.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.14.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.14.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.15.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.15.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.15.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.16.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.16.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.16.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.17.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.17.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.17.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.18.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.18.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.18.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.19.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.19.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.19.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.2.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.2.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.2.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.20.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.20.w2.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.20.w3.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.21.w1.weight": "consolidated-00002-of-00272.safetensors", + "layers.10.experts.21.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.21.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.22.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.22.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.22.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.23.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.23.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.23.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.24.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.24.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.24.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.25.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.25.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.25.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.26.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.26.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.26.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.27.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.27.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.27.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.28.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.28.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.28.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.29.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.29.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.29.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.3.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.3.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.3.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.30.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.30.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.30.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.31.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.31.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.31.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.32.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.32.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.32.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.33.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.33.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.33.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.34.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.34.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.34.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.35.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.35.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.35.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.36.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.36.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.36.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.37.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.37.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.37.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.38.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.38.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.38.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.39.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.39.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.39.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.4.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.4.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.4.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.40.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.40.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.40.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.41.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.41.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.41.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.42.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.42.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.42.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.43.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.43.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.43.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.44.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.44.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.44.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.45.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.45.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.45.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.46.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.46.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.46.w3.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.47.w1.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.47.w2.weight": "consolidated-00003-of-00272.safetensors", + "layers.10.experts.47.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.48.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.48.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.48.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.49.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.49.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.49.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.5.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.5.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.5.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.50.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.50.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.50.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.51.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.51.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.51.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.52.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.52.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.52.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.53.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.53.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.53.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.54.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.54.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.54.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.55.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.55.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.55.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.56.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.56.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.56.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.57.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.57.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.57.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.58.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.58.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.58.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.59.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.59.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.59.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.6.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.6.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.6.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.60.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.60.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.60.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.61.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.61.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.61.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.62.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.62.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.62.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.63.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.63.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.63.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.64.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.64.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.64.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.65.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.65.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.65.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.66.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.66.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.66.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.67.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.67.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.67.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.68.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.68.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.68.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.69.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.69.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.69.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.7.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.7.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.7.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.70.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.70.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.70.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.71.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.71.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.71.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.72.w1.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.72.w2.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.72.w3.weight": "consolidated-00004-of-00272.safetensors", + "layers.10.experts.73.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.73.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.73.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.74.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.74.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.74.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.75.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.75.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.75.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.76.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.76.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.76.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.77.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.77.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.77.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.78.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.78.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.78.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.79.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.79.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.79.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.8.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.8.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.8.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.80.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.80.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.80.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.81.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.81.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.81.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.82.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.82.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.82.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.83.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.83.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.83.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.84.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.84.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.84.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.85.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.85.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.85.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.86.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.86.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.86.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.87.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.87.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.87.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.88.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.88.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.88.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.89.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.89.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.89.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.9.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.9.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.9.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.90.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.90.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.90.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.91.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.91.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.91.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.92.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.92.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.92.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.93.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.93.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.93.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.94.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.94.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.94.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.95.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.95.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.95.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.96.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.96.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.96.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.97.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.97.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.97.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.98.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.98.w2.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.98.w3.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.99.w1.weight": "consolidated-00005-of-00272.safetensors", + "layers.10.experts.99.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.10.experts.99.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.10.ffn_norm.weight": "consolidated-00006-of-00272.safetensors", + "layers.10.gate.weight": "consolidated-00006-of-00272.safetensors", + "layers.10.shared_experts.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.10.shared_experts.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.10.shared_experts.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.attention.kv_a_norm.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.attention.q_a_norm.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.attention.wkv_a_with_mqa.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.attention.wkv_b.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.attention.wo.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.attention.wq_a.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.attention.wq_b.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.attention_norm.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.0.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.0.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.0.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.1.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.1.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.1.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.10.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.10.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.10.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.100.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.100.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.100.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.101.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.101.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.101.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.102.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.102.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.102.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.103.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.103.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.103.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.104.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.104.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.104.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.105.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.105.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.105.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.106.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.106.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.106.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.107.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.107.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.107.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.108.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.108.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.108.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.109.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.109.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.109.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.11.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.11.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.11.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.110.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.110.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.110.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.111.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.111.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.111.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.112.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.112.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.112.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.113.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.113.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.113.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.114.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.114.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.114.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.115.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.115.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.115.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.116.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.116.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.116.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.117.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.117.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.117.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.118.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.118.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.118.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.119.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.119.w2.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.119.w3.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.12.w1.weight": "consolidated-00006-of-00272.safetensors", + "layers.11.experts.12.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.12.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.120.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.120.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.120.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.121.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.121.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.121.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.122.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.122.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.122.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.123.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.123.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.123.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.124.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.124.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.124.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.125.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.125.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.125.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.126.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.126.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.126.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.127.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.127.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.127.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.13.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.13.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.13.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.14.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.14.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.14.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.15.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.15.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.15.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.16.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.16.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.16.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.17.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.17.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.17.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.18.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.18.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.18.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.19.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.19.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.19.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.2.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.2.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.2.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.20.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.20.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.20.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.21.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.21.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.21.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.22.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.22.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.22.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.23.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.23.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.23.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.24.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.24.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.24.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.25.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.25.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.25.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.26.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.26.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.26.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.27.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.27.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.27.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.28.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.28.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.28.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.29.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.29.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.29.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.3.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.3.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.3.w3.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.30.w1.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.30.w2.weight": "consolidated-00007-of-00272.safetensors", + "layers.11.experts.30.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.31.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.31.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.31.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.32.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.32.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.32.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.33.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.33.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.33.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.34.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.34.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.34.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.35.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.35.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.35.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.36.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.36.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.36.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.37.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.37.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.37.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.38.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.38.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.38.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.39.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.39.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.39.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.4.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.4.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.4.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.40.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.40.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.40.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.41.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.41.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.41.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.42.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.42.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.42.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.43.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.43.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.43.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.44.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.44.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.44.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.45.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.45.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.45.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.46.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.46.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.46.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.47.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.47.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.47.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.48.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.48.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.48.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.49.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.49.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.49.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.5.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.5.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.5.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.50.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.50.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.50.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.51.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.51.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.51.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.52.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.52.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.52.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.53.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.53.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.53.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.54.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.54.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.54.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.55.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.55.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.55.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.56.w1.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.56.w2.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.56.w3.weight": "consolidated-00008-of-00272.safetensors", + "layers.11.experts.57.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.57.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.57.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.58.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.58.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.58.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.59.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.59.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.59.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.6.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.6.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.6.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.60.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.60.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.60.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.61.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.61.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.61.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.62.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.62.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.62.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.63.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.63.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.63.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.64.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.64.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.64.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.65.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.65.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.65.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.66.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.66.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.66.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.67.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.67.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.67.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.68.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.68.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.68.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.69.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.69.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.69.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.7.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.7.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.7.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.70.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.70.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.70.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.71.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.71.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.71.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.72.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.72.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.72.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.73.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.73.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.73.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.74.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.74.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.74.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.75.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.75.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.75.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.76.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.76.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.76.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.77.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.77.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.77.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.78.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.78.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.78.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.79.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.79.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.79.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.8.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.8.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.8.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.80.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.80.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.80.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.81.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.81.w2.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.81.w3.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.82.w1.weight": "consolidated-00009-of-00272.safetensors", + "layers.11.experts.82.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.82.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.83.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.83.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.83.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.84.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.84.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.84.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.85.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.85.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.85.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.86.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.86.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.86.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.87.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.87.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.87.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.88.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.88.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.88.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.89.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.89.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.89.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.9.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.9.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.9.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.90.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.90.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.90.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.91.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.91.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.91.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.92.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.92.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.92.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.93.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.93.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.93.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.94.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.94.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.94.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.95.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.95.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.95.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.96.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.96.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.96.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.97.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.97.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.97.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.98.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.98.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.98.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.99.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.99.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.experts.99.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.ffn_norm.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.gate.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.shared_experts.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.shared_experts.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.11.shared_experts.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.attention.kv_a_norm.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.attention.q_a_norm.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.attention.wkv_a_with_mqa.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.attention.wkv_b.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.attention.wo.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.attention.wq_a.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.attention.wq_b.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.attention_norm.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.0.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.0.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.0.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.1.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.1.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.1.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.10.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.10.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.10.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.100.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.100.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.100.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.101.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.101.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.101.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.102.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.102.w2.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.102.w3.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.103.w1.weight": "consolidated-00010-of-00272.safetensors", + "layers.12.experts.103.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.103.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.104.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.104.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.104.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.105.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.105.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.105.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.106.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.106.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.106.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.107.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.107.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.107.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.108.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.108.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.108.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.109.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.109.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.109.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.11.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.11.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.11.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.110.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.110.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.110.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.111.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.111.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.111.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.112.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.112.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.112.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.113.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.113.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.113.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.114.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.114.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.114.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.115.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.115.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.115.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.116.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.116.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.116.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.117.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.117.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.117.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.118.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.118.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.118.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.119.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.119.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.119.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.12.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.12.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.12.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.120.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.120.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.120.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.121.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.121.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.121.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.122.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.122.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.122.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.123.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.123.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.123.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.124.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.124.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.124.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.125.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.125.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.125.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.126.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.126.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.126.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.127.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.127.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.127.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.13.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.13.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.13.w3.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.14.w1.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.14.w2.weight": "consolidated-00011-of-00272.safetensors", + "layers.12.experts.14.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.15.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.15.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.15.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.16.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.16.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.16.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.17.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.17.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.17.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.18.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.18.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.18.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.19.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.19.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.19.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.2.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.2.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.2.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.20.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.20.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.20.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.21.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.21.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.21.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.22.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.22.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.22.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.23.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.23.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.23.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.24.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.24.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.24.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.25.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.25.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.25.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.26.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.26.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.26.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.27.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.27.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.27.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.28.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.28.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.28.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.29.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.29.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.29.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.3.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.3.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.3.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.30.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.30.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.30.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.31.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.31.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.31.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.32.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.32.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.32.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.33.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.33.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.33.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.34.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.34.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.34.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.35.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.35.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.35.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.36.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.36.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.36.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.37.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.37.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.37.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.38.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.38.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.38.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.39.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.39.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.39.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.4.w1.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.4.w2.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.4.w3.weight": "consolidated-00012-of-00272.safetensors", + "layers.12.experts.40.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.40.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.40.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.41.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.41.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.41.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.42.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.42.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.42.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.43.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.43.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.43.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.44.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.44.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.44.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.45.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.45.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.45.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.46.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.46.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.46.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.47.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.47.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.47.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.48.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.48.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.48.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.49.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.49.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.49.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.5.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.5.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.5.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.50.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.50.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.50.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.51.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.51.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.51.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.52.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.52.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.52.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.53.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.53.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.53.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.54.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.54.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.54.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.55.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.55.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.55.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.56.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.56.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.56.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.57.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.57.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.57.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.58.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.58.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.58.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.59.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.59.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.59.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.6.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.6.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.6.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.60.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.60.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.60.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.61.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.61.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.61.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.62.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.62.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.62.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.63.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.63.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.63.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.64.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.64.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.64.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.65.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.65.w2.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.65.w3.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.66.w1.weight": "consolidated-00013-of-00272.safetensors", + "layers.12.experts.66.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.66.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.67.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.67.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.67.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.68.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.68.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.68.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.69.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.69.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.69.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.7.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.7.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.7.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.70.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.70.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.70.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.71.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.71.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.71.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.72.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.72.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.72.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.73.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.73.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.73.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.74.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.74.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.74.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.75.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.75.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.75.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.76.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.76.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.76.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.77.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.77.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.77.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.78.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.78.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.78.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.79.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.79.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.79.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.8.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.8.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.8.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.80.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.80.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.80.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.81.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.81.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.81.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.82.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.82.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.82.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.83.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.83.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.83.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.84.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.84.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.84.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.85.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.85.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.85.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.86.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.86.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.86.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.87.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.87.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.87.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.88.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.88.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.88.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.89.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.89.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.89.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.9.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.9.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.9.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.90.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.90.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.90.w3.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.91.w1.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.91.w2.weight": "consolidated-00014-of-00272.safetensors", + "layers.12.experts.91.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.92.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.92.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.92.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.93.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.93.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.93.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.94.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.94.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.94.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.95.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.95.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.95.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.96.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.96.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.96.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.97.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.97.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.97.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.98.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.98.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.98.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.99.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.99.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.experts.99.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.ffn_norm.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.gate.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.shared_experts.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.shared_experts.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.12.shared_experts.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.attention.kv_a_norm.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.attention.q_a_norm.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.attention.wkv_a_with_mqa.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.attention.wkv_b.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.attention.wo.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.attention.wq_a.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.attention.wq_b.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.attention_norm.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.0.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.0.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.0.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.1.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.1.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.1.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.10.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.10.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.10.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.100.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.100.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.100.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.101.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.101.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.101.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.102.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.102.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.102.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.103.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.103.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.103.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.104.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.104.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.104.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.105.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.105.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.105.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.106.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.106.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.106.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.107.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.107.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.107.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.108.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.108.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.108.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.109.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.109.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.109.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.11.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.11.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.11.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.110.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.110.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.110.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.111.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.111.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.111.w3.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.112.w1.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.112.w2.weight": "consolidated-00015-of-00272.safetensors", + "layers.13.experts.112.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.113.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.113.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.113.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.114.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.114.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.114.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.115.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.115.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.115.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.116.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.116.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.116.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.117.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.117.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.117.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.118.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.118.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.118.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.119.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.119.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.119.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.12.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.12.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.12.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.120.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.120.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.120.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.121.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.121.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.121.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.122.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.122.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.122.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.123.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.123.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.123.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.124.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.124.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.124.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.125.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.125.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.125.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.126.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.126.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.126.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.127.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.127.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.127.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.13.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.13.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.13.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.14.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.14.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.14.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.15.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.15.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.15.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.16.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.16.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.16.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.17.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.17.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.17.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.18.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.18.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.18.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.19.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.19.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.19.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.2.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.2.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.2.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.20.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.20.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.20.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.21.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.21.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.21.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.22.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.22.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.22.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.23.w1.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.23.w2.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.23.w3.weight": "consolidated-00016-of-00272.safetensors", + "layers.13.experts.24.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.24.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.24.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.25.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.25.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.25.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.26.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.26.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.26.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.27.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.27.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.27.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.28.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.28.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.28.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.29.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.29.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.29.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.3.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.3.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.3.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.30.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.30.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.30.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.31.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.31.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.31.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.32.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.32.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.32.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.33.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.33.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.33.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.34.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.34.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.34.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.35.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.35.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.35.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.36.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.36.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.36.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.37.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.37.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.37.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.38.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.38.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.38.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.39.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.39.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.39.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.4.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.4.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.4.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.40.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.40.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.40.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.41.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.41.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.41.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.42.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.42.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.42.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.43.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.43.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.43.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.44.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.44.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.44.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.45.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.45.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.45.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.46.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.46.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.46.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.47.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.47.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.47.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.48.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.48.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.48.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.49.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.49.w2.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.49.w3.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.5.w1.weight": "consolidated-00017-of-00272.safetensors", + "layers.13.experts.5.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.5.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.50.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.50.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.50.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.51.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.51.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.51.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.52.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.52.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.52.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.53.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.53.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.53.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.54.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.54.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.54.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.55.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.55.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.55.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.56.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.56.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.56.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.57.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.57.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.57.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.58.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.58.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.58.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.59.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.59.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.59.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.6.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.6.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.6.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.60.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.60.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.60.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.61.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.61.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.61.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.62.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.62.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.62.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.63.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.63.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.63.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.64.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.64.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.64.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.65.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.65.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.65.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.66.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.66.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.66.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.67.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.67.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.67.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.68.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.68.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.68.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.69.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.69.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.69.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.7.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.7.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.7.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.70.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.70.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.70.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.71.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.71.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.71.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.72.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.72.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.72.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.73.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.73.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.73.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.74.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.74.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.74.w3.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.75.w1.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.75.w2.weight": "consolidated-00018-of-00272.safetensors", + "layers.13.experts.75.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.76.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.76.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.76.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.77.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.77.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.77.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.78.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.78.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.78.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.79.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.79.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.79.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.8.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.8.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.8.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.80.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.80.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.80.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.81.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.81.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.81.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.82.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.82.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.82.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.83.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.83.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.83.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.84.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.84.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.84.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.85.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.85.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.85.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.86.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.86.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.86.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.87.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.87.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.87.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.88.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.88.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.88.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.89.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.89.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.89.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.9.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.9.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.9.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.90.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.90.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.90.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.91.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.91.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.91.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.92.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.92.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.92.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.93.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.93.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.93.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.94.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.94.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.94.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.95.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.95.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.95.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.96.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.96.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.96.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.97.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.97.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.97.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.98.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.98.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.98.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.99.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.99.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.experts.99.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.ffn_norm.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.gate.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.shared_experts.w1.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.shared_experts.w2.weight": "consolidated-00019-of-00272.safetensors", + "layers.13.shared_experts.w3.weight": "consolidated-00019-of-00272.safetensors", + "layers.14.attention.kv_a_norm.weight": "consolidated-00019-of-00272.safetensors", + "layers.14.attention.q_a_norm.weight": "consolidated-00019-of-00272.safetensors", + "layers.14.attention.wkv_a_with_mqa.weight": "consolidated-00019-of-00272.safetensors", + "layers.14.attention.wkv_b.weight": "consolidated-00019-of-00272.safetensors", + "layers.14.attention.wo.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.attention.wq_a.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.attention.wq_b.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.attention_norm.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.0.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.0.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.0.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.1.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.1.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.1.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.10.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.10.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.10.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.100.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.100.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.100.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.101.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.101.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.101.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.102.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.102.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.102.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.103.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.103.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.103.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.104.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.104.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.104.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.105.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.105.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.105.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.106.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.106.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.106.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.107.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.107.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.107.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.108.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.108.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.108.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.109.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.109.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.109.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.11.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.11.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.11.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.110.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.110.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.110.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.111.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.111.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.111.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.112.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.112.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.112.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.113.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.113.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.113.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.114.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.114.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.114.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.115.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.115.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.115.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.116.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.116.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.116.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.117.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.117.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.117.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.118.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.118.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.118.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.119.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.119.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.119.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.12.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.12.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.12.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.120.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.120.w2.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.120.w3.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.121.w1.weight": "consolidated-00020-of-00272.safetensors", + "layers.14.experts.121.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.121.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.122.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.122.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.122.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.123.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.123.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.123.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.124.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.124.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.124.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.125.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.125.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.125.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.126.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.126.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.126.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.127.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.127.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.127.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.13.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.13.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.13.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.14.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.14.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.14.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.15.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.15.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.15.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.16.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.16.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.16.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.17.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.17.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.17.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.18.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.18.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.18.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.19.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.19.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.19.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.2.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.2.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.2.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.20.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.20.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.20.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.21.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.21.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.21.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.22.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.22.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.22.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.23.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.23.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.23.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.24.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.24.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.24.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.25.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.25.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.25.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.26.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.26.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.26.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.27.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.27.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.27.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.28.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.28.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.28.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.29.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.29.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.29.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.3.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.3.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.3.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.30.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.30.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.30.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.31.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.31.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.31.w3.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.32.w1.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.32.w2.weight": "consolidated-00021-of-00272.safetensors", + "layers.14.experts.32.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.33.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.33.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.33.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.34.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.34.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.34.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.35.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.35.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.35.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.36.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.36.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.36.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.37.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.37.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.37.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.38.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.38.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.38.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.39.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.39.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.39.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.4.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.4.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.4.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.40.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.40.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.40.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.41.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.41.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.41.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.42.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.42.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.42.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.43.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.43.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.43.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.44.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.44.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.44.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.45.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.45.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.45.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.46.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.46.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.46.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.47.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.47.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.47.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.48.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.48.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.48.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.49.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.49.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.49.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.5.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.5.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.5.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.50.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.50.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.50.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.51.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.51.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.51.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.52.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.52.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.52.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.53.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.53.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.53.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.54.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.54.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.54.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.55.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.55.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.55.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.56.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.56.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.56.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.57.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.57.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.57.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.58.w1.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.58.w2.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.58.w3.weight": "consolidated-00022-of-00272.safetensors", + "layers.14.experts.59.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.59.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.59.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.6.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.6.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.6.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.60.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.60.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.60.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.61.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.61.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.61.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.62.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.62.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.62.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.63.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.63.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.63.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.64.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.64.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.64.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.65.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.65.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.65.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.66.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.66.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.66.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.67.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.67.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.67.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.68.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.68.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.68.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.69.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.69.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.69.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.7.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.7.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.7.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.70.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.70.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.70.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.71.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.71.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.71.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.72.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.72.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.72.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.73.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.73.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.73.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.74.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.74.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.74.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.75.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.75.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.75.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.76.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.76.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.76.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.77.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.77.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.77.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.78.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.78.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.78.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.79.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.79.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.79.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.8.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.8.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.8.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.80.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.80.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.80.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.81.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.81.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.81.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.82.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.82.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.82.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.83.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.83.w2.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.83.w3.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.84.w1.weight": "consolidated-00023-of-00272.safetensors", + "layers.14.experts.84.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.84.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.85.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.85.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.85.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.86.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.86.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.86.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.87.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.87.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.87.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.88.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.88.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.88.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.89.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.89.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.89.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.9.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.9.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.9.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.90.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.90.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.90.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.91.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.91.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.91.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.92.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.92.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.92.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.93.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.93.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.93.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.94.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.94.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.94.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.95.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.95.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.95.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.96.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.96.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.96.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.97.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.97.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.97.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.98.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.98.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.98.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.99.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.99.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.experts.99.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.ffn_norm.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.gate.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.shared_experts.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.shared_experts.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.14.shared_experts.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.attention.kv_a_norm.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.attention.q_a_norm.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.attention.wkv_a_with_mqa.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.attention.wkv_b.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.attention.wo.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.attention.wq_a.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.attention.wq_b.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.attention_norm.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.0.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.0.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.0.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.1.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.1.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.1.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.10.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.10.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.10.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.100.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.100.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.100.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.101.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.101.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.101.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.102.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.102.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.102.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.103.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.103.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.103.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.104.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.104.w2.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.104.w3.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.105.w1.weight": "consolidated-00024-of-00272.safetensors", + "layers.15.experts.105.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.105.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.106.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.106.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.106.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.107.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.107.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.107.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.108.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.108.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.108.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.109.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.109.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.109.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.11.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.11.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.11.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.110.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.110.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.110.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.111.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.111.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.111.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.112.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.112.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.112.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.113.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.113.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.113.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.114.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.114.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.114.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.115.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.115.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.115.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.116.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.116.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.116.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.117.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.117.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.117.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.118.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.118.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.118.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.119.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.119.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.119.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.12.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.12.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.12.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.120.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.120.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.120.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.121.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.121.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.121.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.122.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.122.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.122.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.123.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.123.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.123.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.124.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.124.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.124.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.125.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.125.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.125.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.126.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.126.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.126.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.127.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.127.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.127.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.13.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.13.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.13.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.14.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.14.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.14.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.15.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.15.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.15.w3.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.16.w1.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.16.w2.weight": "consolidated-00025-of-00272.safetensors", + "layers.15.experts.16.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.17.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.17.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.17.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.18.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.18.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.18.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.19.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.19.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.19.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.2.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.2.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.2.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.20.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.20.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.20.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.21.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.21.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.21.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.22.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.22.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.22.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.23.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.23.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.23.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.24.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.24.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.24.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.25.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.25.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.25.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.26.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.26.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.26.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.27.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.27.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.27.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.28.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.28.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.28.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.29.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.29.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.29.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.3.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.3.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.3.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.30.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.30.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.30.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.31.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.31.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.31.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.32.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.32.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.32.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.33.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.33.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.33.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.34.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.34.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.34.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.35.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.35.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.35.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.36.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.36.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.36.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.37.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.37.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.37.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.38.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.38.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.38.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.39.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.39.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.39.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.4.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.4.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.4.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.40.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.40.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.40.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.41.w1.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.41.w2.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.41.w3.weight": "consolidated-00026-of-00272.safetensors", + "layers.15.experts.42.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.42.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.42.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.43.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.43.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.43.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.44.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.44.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.44.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.45.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.45.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.45.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.46.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.46.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.46.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.47.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.47.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.47.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.48.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.48.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.48.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.49.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.49.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.49.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.5.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.5.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.5.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.50.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.50.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.50.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.51.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.51.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.51.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.52.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.52.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.52.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.53.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.53.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.53.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.54.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.54.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.54.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.55.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.55.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.55.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.56.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.56.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.56.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.57.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.57.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.57.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.58.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.58.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.58.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.59.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.59.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.59.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.6.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.6.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.6.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.60.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.60.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.60.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.61.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.61.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.61.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.62.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.62.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.62.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.63.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.63.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.63.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.64.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.64.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.64.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.65.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.65.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.65.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.66.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.66.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.66.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.67.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.67.w2.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.67.w3.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.68.w1.weight": "consolidated-00027-of-00272.safetensors", + "layers.15.experts.68.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.68.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.69.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.69.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.69.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.7.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.7.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.7.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.70.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.70.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.70.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.71.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.71.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.71.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.72.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.72.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.72.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.73.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.73.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.73.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.74.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.74.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.74.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.75.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.75.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.75.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.76.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.76.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.76.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.77.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.77.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.77.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.78.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.78.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.78.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.79.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.79.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.79.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.8.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.8.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.8.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.80.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.80.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.80.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.81.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.81.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.81.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.82.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.82.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.82.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.83.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.83.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.83.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.84.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.84.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.84.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.85.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.85.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.85.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.86.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.86.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.86.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.87.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.87.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.87.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.88.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.88.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.88.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.89.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.89.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.89.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.9.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.9.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.9.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.90.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.90.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.90.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.91.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.91.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.91.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.92.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.92.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.92.w3.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.93.w1.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.93.w2.weight": "consolidated-00028-of-00272.safetensors", + "layers.15.experts.93.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.94.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.94.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.94.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.95.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.95.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.95.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.96.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.96.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.96.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.97.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.97.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.97.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.98.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.98.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.98.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.99.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.99.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.experts.99.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.ffn_norm.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.gate.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.shared_experts.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.shared_experts.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.15.shared_experts.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.attention.kv_a_norm.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.attention.q_a_norm.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.attention.wkv_a_with_mqa.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.attention.wkv_b.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.attention.wo.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.attention.wq_a.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.attention.wq_b.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.attention_norm.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.0.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.0.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.0.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.1.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.1.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.1.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.10.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.10.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.10.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.100.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.100.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.100.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.101.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.101.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.101.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.102.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.102.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.102.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.103.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.103.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.103.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.104.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.104.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.104.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.105.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.105.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.105.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.106.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.106.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.106.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.107.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.107.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.107.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.108.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.108.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.108.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.109.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.109.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.109.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.11.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.11.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.11.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.110.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.110.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.110.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.111.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.111.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.111.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.112.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.112.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.112.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.113.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.113.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.113.w3.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.114.w1.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.114.w2.weight": "consolidated-00029-of-00272.safetensors", + "layers.16.experts.114.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.115.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.115.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.115.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.116.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.116.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.116.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.117.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.117.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.117.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.118.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.118.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.118.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.119.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.119.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.119.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.12.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.12.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.12.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.120.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.120.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.120.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.121.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.121.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.121.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.122.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.122.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.122.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.123.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.123.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.123.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.124.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.124.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.124.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.125.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.125.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.125.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.126.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.126.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.126.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.127.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.127.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.127.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.13.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.13.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.13.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.14.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.14.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.14.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.15.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.15.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.15.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.16.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.16.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.16.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.17.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.17.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.17.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.18.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.18.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.18.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.19.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.19.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.19.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.2.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.2.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.2.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.20.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.20.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.20.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.21.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.21.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.21.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.22.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.22.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.22.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.23.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.23.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.23.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.24.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.24.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.24.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.25.w1.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.25.w2.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.25.w3.weight": "consolidated-00030-of-00272.safetensors", + "layers.16.experts.26.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.26.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.26.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.27.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.27.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.27.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.28.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.28.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.28.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.29.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.29.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.29.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.3.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.3.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.3.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.30.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.30.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.30.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.31.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.31.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.31.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.32.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.32.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.32.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.33.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.33.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.33.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.34.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.34.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.34.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.35.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.35.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.35.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.36.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.36.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.36.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.37.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.37.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.37.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.38.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.38.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.38.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.39.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.39.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.39.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.4.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.4.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.4.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.40.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.40.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.40.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.41.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.41.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.41.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.42.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.42.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.42.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.43.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.43.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.43.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.44.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.44.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.44.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.45.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.45.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.45.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.46.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.46.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.46.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.47.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.47.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.47.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.48.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.48.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.48.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.49.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.49.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.49.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.5.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.5.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.5.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.50.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.50.w2.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.50.w3.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.51.w1.weight": "consolidated-00031-of-00272.safetensors", + "layers.16.experts.51.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.51.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.52.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.52.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.52.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.53.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.53.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.53.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.54.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.54.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.54.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.55.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.55.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.55.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.56.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.56.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.56.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.57.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.57.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.57.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.58.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.58.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.58.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.59.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.59.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.59.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.6.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.6.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.6.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.60.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.60.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.60.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.61.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.61.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.61.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.62.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.62.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.62.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.63.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.63.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.63.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.64.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.64.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.64.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.65.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.65.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.65.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.66.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.66.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.66.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.67.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.67.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.67.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.68.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.68.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.68.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.69.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.69.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.69.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.7.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.7.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.7.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.70.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.70.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.70.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.71.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.71.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.71.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.72.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.72.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.72.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.73.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.73.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.73.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.74.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.74.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.74.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.75.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.75.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.75.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.76.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.76.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.76.w3.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.77.w1.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.77.w2.weight": "consolidated-00032-of-00272.safetensors", + "layers.16.experts.77.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.78.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.78.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.78.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.79.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.79.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.79.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.8.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.8.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.8.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.80.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.80.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.80.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.81.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.81.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.81.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.82.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.82.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.82.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.83.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.83.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.83.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.84.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.84.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.84.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.85.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.85.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.85.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.86.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.86.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.86.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.87.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.87.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.87.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.88.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.88.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.88.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.89.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.89.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.89.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.9.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.9.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.9.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.90.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.90.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.90.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.91.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.91.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.91.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.92.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.92.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.92.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.93.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.93.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.93.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.94.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.94.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.94.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.95.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.95.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.95.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.96.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.96.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.96.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.97.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.97.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.97.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.98.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.98.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.98.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.99.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.99.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.experts.99.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.ffn_norm.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.gate.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.shared_experts.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.shared_experts.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.16.shared_experts.w3.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.attention.kv_a_norm.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.attention.q_a_norm.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.attention.wkv_a_with_mqa.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.attention.wkv_b.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.attention.wo.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.attention.wq_a.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.attention.wq_b.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.attention_norm.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.experts.0.w1.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.experts.0.w2.weight": "consolidated-00033-of-00272.safetensors", + "layers.17.experts.0.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.1.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.1.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.1.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.10.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.10.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.10.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.100.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.100.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.100.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.101.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.101.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.101.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.102.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.102.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.102.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.103.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.103.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.103.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.104.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.104.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.104.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.105.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.105.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.105.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.106.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.106.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.106.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.107.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.107.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.107.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.108.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.108.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.108.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.109.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.109.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.109.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.11.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.11.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.11.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.110.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.110.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.110.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.111.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.111.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.111.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.112.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.112.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.112.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.113.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.113.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.113.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.114.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.114.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.114.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.115.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.115.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.115.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.116.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.116.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.116.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.117.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.117.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.117.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.118.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.118.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.118.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.119.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.119.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.119.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.12.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.12.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.12.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.120.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.120.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.120.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.121.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.121.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.121.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.122.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.122.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.122.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.123.w1.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.123.w2.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.123.w3.weight": "consolidated-00034-of-00272.safetensors", + "layers.17.experts.124.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.124.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.124.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.125.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.125.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.125.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.126.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.126.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.126.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.127.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.127.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.127.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.13.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.13.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.13.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.14.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.14.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.14.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.15.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.15.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.15.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.16.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.16.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.16.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.17.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.17.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.17.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.18.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.18.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.18.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.19.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.19.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.19.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.2.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.2.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.2.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.20.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.20.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.20.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.21.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.21.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.21.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.22.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.22.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.22.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.23.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.23.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.23.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.24.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.24.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.24.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.25.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.25.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.25.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.26.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.26.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.26.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.27.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.27.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.27.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.28.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.28.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.28.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.29.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.29.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.29.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.3.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.3.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.3.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.30.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.30.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.30.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.31.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.31.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.31.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.32.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.32.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.32.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.33.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.33.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.33.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.34.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.34.w2.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.34.w3.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.35.w1.weight": "consolidated-00035-of-00272.safetensors", + "layers.17.experts.35.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.35.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.36.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.36.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.36.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.37.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.37.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.37.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.38.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.38.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.38.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.39.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.39.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.39.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.4.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.4.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.4.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.40.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.40.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.40.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.41.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.41.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.41.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.42.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.42.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.42.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.43.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.43.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.43.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.44.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.44.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.44.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.45.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.45.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.45.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.46.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.46.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.46.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.47.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.47.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.47.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.48.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.48.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.48.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.49.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.49.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.49.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.5.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.5.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.5.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.50.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.50.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.50.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.51.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.51.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.51.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.52.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.52.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.52.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.53.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.53.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.53.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.54.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.54.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.54.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.55.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.55.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.55.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.56.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.56.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.56.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.57.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.57.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.57.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.58.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.58.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.58.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.59.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.59.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.59.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.6.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.6.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.6.w3.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.60.w1.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.60.w2.weight": "consolidated-00036-of-00272.safetensors", + "layers.17.experts.60.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.61.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.61.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.61.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.62.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.62.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.62.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.63.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.63.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.63.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.64.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.64.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.64.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.65.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.65.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.65.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.66.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.66.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.66.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.67.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.67.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.67.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.68.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.68.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.68.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.69.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.69.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.69.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.7.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.7.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.7.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.70.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.70.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.70.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.71.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.71.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.71.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.72.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.72.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.72.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.73.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.73.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.73.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.74.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.74.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.74.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.75.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.75.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.75.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.76.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.76.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.76.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.77.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.77.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.77.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.78.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.78.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.78.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.79.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.79.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.79.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.8.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.8.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.8.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.80.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.80.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.80.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.81.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.81.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.81.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.82.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.82.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.82.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.83.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.83.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.83.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.84.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.84.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.84.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.85.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.85.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.85.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.86.w1.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.86.w2.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.86.w3.weight": "consolidated-00037-of-00272.safetensors", + "layers.17.experts.87.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.87.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.87.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.88.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.88.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.88.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.89.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.89.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.89.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.9.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.9.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.9.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.90.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.90.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.90.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.91.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.91.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.91.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.92.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.92.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.92.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.93.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.93.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.93.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.94.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.94.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.94.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.95.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.95.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.95.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.96.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.96.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.96.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.97.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.97.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.97.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.98.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.98.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.98.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.99.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.99.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.experts.99.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.ffn_norm.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.gate.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.shared_experts.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.shared_experts.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.17.shared_experts.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.attention.kv_a_norm.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.attention.q_a_norm.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.attention.wkv_a_with_mqa.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.attention.wkv_b.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.attention.wo.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.attention.wq_a.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.attention.wq_b.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.attention_norm.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.0.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.0.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.0.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.1.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.1.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.1.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.10.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.10.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.10.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.100.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.100.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.100.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.101.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.101.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.101.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.102.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.102.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.102.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.103.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.103.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.103.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.104.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.104.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.104.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.105.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.105.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.105.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.106.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.106.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.106.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.107.w1.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.107.w2.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.107.w3.weight": "consolidated-00038-of-00272.safetensors", + "layers.18.experts.108.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.108.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.108.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.109.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.109.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.109.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.11.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.11.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.11.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.110.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.110.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.110.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.111.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.111.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.111.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.112.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.112.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.112.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.113.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.113.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.113.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.114.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.114.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.114.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.115.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.115.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.115.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.116.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.116.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.116.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.117.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.117.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.117.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.118.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.118.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.118.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.119.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.119.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.119.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.12.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.12.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.12.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.120.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.120.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.120.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.121.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.121.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.121.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.122.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.122.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.122.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.123.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.123.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.123.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.124.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.124.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.124.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.125.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.125.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.125.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.126.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.126.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.126.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.127.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.127.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.127.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.13.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.13.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.13.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.14.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.14.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.14.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.15.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.15.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.15.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.16.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.16.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.16.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.17.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.17.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.17.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.18.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.18.w2.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.18.w3.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.19.w1.weight": "consolidated-00039-of-00272.safetensors", + "layers.18.experts.19.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.19.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.2.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.2.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.2.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.20.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.20.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.20.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.21.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.21.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.21.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.22.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.22.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.22.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.23.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.23.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.23.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.24.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.24.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.24.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.25.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.25.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.25.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.26.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.26.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.26.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.27.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.27.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.27.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.28.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.28.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.28.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.29.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.29.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.29.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.3.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.3.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.3.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.30.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.30.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.30.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.31.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.31.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.31.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.32.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.32.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.32.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.33.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.33.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.33.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.34.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.34.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.34.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.35.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.35.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.35.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.36.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.36.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.36.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.37.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.37.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.37.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.38.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.38.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.38.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.39.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.39.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.39.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.4.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.4.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.4.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.40.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.40.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.40.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.41.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.41.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.41.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.42.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.42.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.42.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.43.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.43.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.43.w3.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.44.w1.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.44.w2.weight": "consolidated-00040-of-00272.safetensors", + "layers.18.experts.44.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.45.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.45.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.45.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.46.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.46.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.46.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.47.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.47.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.47.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.48.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.48.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.48.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.49.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.49.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.49.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.5.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.5.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.5.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.50.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.50.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.50.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.51.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.51.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.51.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.52.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.52.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.52.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.53.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.53.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.53.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.54.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.54.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.54.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.55.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.55.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.55.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.56.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.56.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.56.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.57.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.57.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.57.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.58.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.58.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.58.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.59.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.59.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.59.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.6.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.6.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.6.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.60.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.60.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.60.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.61.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.61.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.61.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.62.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.62.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.62.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.63.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.63.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.63.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.64.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.64.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.64.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.65.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.65.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.65.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.66.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.66.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.66.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.67.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.67.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.67.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.68.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.68.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.68.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.69.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.69.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.69.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.7.w1.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.7.w2.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.7.w3.weight": "consolidated-00041-of-00272.safetensors", + "layers.18.experts.70.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.70.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.70.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.71.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.71.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.71.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.72.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.72.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.72.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.73.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.73.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.73.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.74.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.74.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.74.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.75.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.75.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.75.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.76.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.76.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.76.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.77.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.77.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.77.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.78.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.78.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.78.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.79.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.79.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.79.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.8.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.8.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.8.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.80.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.80.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.80.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.81.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.81.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.81.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.82.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.82.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.82.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.83.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.83.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.83.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.84.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.84.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.84.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.85.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.85.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.85.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.86.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.86.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.86.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.87.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.87.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.87.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.88.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.88.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.88.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.89.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.89.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.89.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.9.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.9.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.9.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.90.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.90.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.90.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.91.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.91.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.91.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.92.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.92.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.92.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.93.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.93.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.93.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.94.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.94.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.94.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.95.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.95.w2.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.95.w3.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.96.w1.weight": "consolidated-00042-of-00272.safetensors", + "layers.18.experts.96.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.96.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.97.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.97.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.97.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.98.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.98.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.98.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.99.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.99.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.experts.99.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.ffn_norm.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.gate.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.shared_experts.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.shared_experts.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.18.shared_experts.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.attention.kv_a_norm.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.attention.q_a_norm.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.attention.wkv_a_with_mqa.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.attention.wkv_b.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.attention.wo.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.attention.wq_a.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.attention.wq_b.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.attention_norm.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.0.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.0.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.0.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.1.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.1.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.1.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.10.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.10.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.10.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.100.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.100.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.100.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.101.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.101.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.101.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.102.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.102.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.102.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.103.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.103.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.103.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.104.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.104.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.104.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.105.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.105.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.105.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.106.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.106.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.106.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.107.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.107.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.107.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.108.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.108.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.108.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.109.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.109.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.109.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.11.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.11.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.11.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.110.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.110.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.110.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.111.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.111.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.111.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.112.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.112.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.112.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.113.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.113.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.113.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.114.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.114.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.114.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.115.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.115.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.115.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.116.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.116.w2.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.116.w3.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.117.w1.weight": "consolidated-00043-of-00272.safetensors", + "layers.19.experts.117.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.117.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.118.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.118.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.118.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.119.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.119.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.119.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.12.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.12.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.12.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.120.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.120.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.120.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.121.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.121.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.121.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.122.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.122.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.122.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.123.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.123.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.123.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.124.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.124.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.124.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.125.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.125.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.125.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.126.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.126.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.126.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.127.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.127.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.127.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.13.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.13.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.13.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.14.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.14.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.14.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.15.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.15.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.15.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.16.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.16.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.16.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.17.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.17.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.17.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.18.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.18.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.18.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.19.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.19.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.19.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.2.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.2.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.2.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.20.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.20.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.20.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.21.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.21.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.21.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.22.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.22.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.22.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.23.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.23.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.23.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.24.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.24.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.24.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.25.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.25.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.25.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.26.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.26.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.26.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.27.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.27.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.27.w3.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.28.w1.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.28.w2.weight": "consolidated-00044-of-00272.safetensors", + "layers.19.experts.28.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.29.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.29.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.29.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.3.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.3.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.3.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.30.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.30.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.30.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.31.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.31.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.31.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.32.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.32.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.32.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.33.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.33.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.33.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.34.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.34.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.34.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.35.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.35.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.35.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.36.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.36.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.36.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.37.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.37.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.37.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.38.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.38.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.38.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.39.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.39.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.39.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.4.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.4.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.4.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.40.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.40.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.40.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.41.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.41.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.41.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.42.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.42.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.42.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.43.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.43.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.43.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.44.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.44.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.44.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.45.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.45.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.45.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.46.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.46.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.46.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.47.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.47.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.47.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.48.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.48.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.48.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.49.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.49.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.49.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.5.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.5.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.5.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.50.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.50.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.50.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.51.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.51.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.51.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.52.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.52.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.52.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.53.w1.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.53.w2.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.53.w3.weight": "consolidated-00045-of-00272.safetensors", + "layers.19.experts.54.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.54.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.54.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.55.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.55.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.55.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.56.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.56.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.56.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.57.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.57.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.57.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.58.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.58.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.58.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.59.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.59.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.59.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.6.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.6.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.6.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.60.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.60.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.60.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.61.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.61.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.61.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.62.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.62.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.62.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.63.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.63.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.63.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.64.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.64.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.64.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.65.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.65.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.65.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.66.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.66.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.66.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.67.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.67.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.67.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.68.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.68.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.68.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.69.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.69.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.69.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.7.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.7.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.7.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.70.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.70.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.70.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.71.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.71.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.71.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.72.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.72.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.72.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.73.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.73.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.73.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.74.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.74.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.74.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.75.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.75.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.75.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.76.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.76.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.76.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.77.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.77.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.77.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.78.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.78.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.78.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.79.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.79.w2.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.79.w3.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.8.w1.weight": "consolidated-00046-of-00272.safetensors", + "layers.19.experts.8.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.8.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.80.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.80.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.80.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.81.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.81.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.81.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.82.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.82.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.82.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.83.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.83.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.83.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.84.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.84.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.84.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.85.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.85.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.85.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.86.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.86.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.86.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.87.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.87.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.87.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.88.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.88.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.88.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.89.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.89.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.89.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.9.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.9.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.9.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.90.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.90.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.90.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.91.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.91.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.91.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.92.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.92.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.92.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.93.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.93.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.93.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.94.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.94.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.94.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.95.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.95.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.95.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.96.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.96.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.96.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.97.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.97.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.97.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.98.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.98.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.98.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.99.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.99.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.experts.99.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.ffn_norm.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.gate.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.shared_experts.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.shared_experts.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.19.shared_experts.w3.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.attention.kv_a_norm.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.attention.q_a_norm.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.attention.wkv_a_with_mqa.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.attention.wkv_b.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.attention.wo.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.attention.wq_a.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.attention.wq_b.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.attention_norm.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.feed_forward.w1.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.feed_forward.w2.weight": "consolidated-00047-of-00272.safetensors", + "layers.2.feed_forward.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.2.ffn_norm.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.attention.kv_a_norm.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.attention.q_a_norm.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.attention.wkv_a_with_mqa.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.attention.wkv_b.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.attention.wo.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.attention.wq_a.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.attention.wq_b.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.attention_norm.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.0.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.0.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.0.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.1.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.1.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.1.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.10.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.10.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.10.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.100.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.100.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.100.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.101.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.101.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.101.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.102.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.102.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.102.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.103.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.103.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.103.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.104.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.104.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.104.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.105.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.105.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.105.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.106.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.106.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.106.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.107.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.107.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.107.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.108.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.108.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.108.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.109.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.109.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.109.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.11.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.11.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.11.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.110.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.110.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.110.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.111.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.111.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.111.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.112.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.112.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.112.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.113.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.113.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.113.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.114.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.114.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.114.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.115.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.115.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.115.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.116.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.116.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.116.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.117.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.117.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.117.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.118.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.118.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.118.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.119.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.119.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.119.w3.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.12.w1.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.12.w2.weight": "consolidated-00048-of-00272.safetensors", + "layers.20.experts.12.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.120.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.120.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.120.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.121.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.121.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.121.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.122.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.122.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.122.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.123.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.123.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.123.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.124.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.124.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.124.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.125.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.125.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.125.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.126.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.126.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.126.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.127.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.127.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.127.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.13.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.13.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.13.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.14.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.14.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.14.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.15.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.15.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.15.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.16.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.16.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.16.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.17.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.17.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.17.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.18.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.18.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.18.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.19.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.19.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.19.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.2.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.2.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.2.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.20.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.20.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.20.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.21.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.21.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.21.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.22.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.22.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.22.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.23.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.23.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.23.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.24.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.24.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.24.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.25.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.25.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.25.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.26.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.26.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.26.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.27.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.27.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.27.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.28.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.28.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.28.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.29.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.29.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.29.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.3.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.3.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.3.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.30.w1.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.30.w2.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.30.w3.weight": "consolidated-00049-of-00272.safetensors", + "layers.20.experts.31.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.31.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.31.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.32.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.32.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.32.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.33.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.33.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.33.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.34.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.34.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.34.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.35.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.35.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.35.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.36.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.36.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.36.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.37.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.37.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.37.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.38.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.38.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.38.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.39.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.39.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.39.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.4.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.4.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.4.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.40.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.40.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.40.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.41.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.41.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.41.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.42.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.42.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.42.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.43.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.43.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.43.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.44.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.44.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.44.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.45.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.45.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.45.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.46.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.46.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.46.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.47.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.47.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.47.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.48.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.48.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.48.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.49.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.49.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.49.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.5.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.5.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.5.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.50.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.50.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.50.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.51.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.51.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.51.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.52.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.52.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.52.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.53.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.53.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.53.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.54.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.54.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.54.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.55.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.55.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.55.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.56.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.56.w2.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.56.w3.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.57.w1.weight": "consolidated-00050-of-00272.safetensors", + "layers.20.experts.57.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.57.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.58.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.58.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.58.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.59.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.59.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.59.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.6.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.6.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.6.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.60.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.60.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.60.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.61.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.61.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.61.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.62.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.62.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.62.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.63.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.63.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.63.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.64.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.64.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.64.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.65.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.65.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.65.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.66.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.66.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.66.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.67.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.67.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.67.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.68.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.68.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.68.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.69.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.69.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.69.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.7.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.7.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.7.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.70.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.70.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.70.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.71.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.71.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.71.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.72.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.72.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.72.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.73.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.73.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.73.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.74.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.74.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.74.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.75.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.75.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.75.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.76.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.76.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.76.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.77.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.77.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.77.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.78.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.78.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.78.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.79.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.79.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.79.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.8.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.8.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.8.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.80.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.80.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.80.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.81.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.81.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.81.w3.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.82.w1.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.82.w2.weight": "consolidated-00051-of-00272.safetensors", + "layers.20.experts.82.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.83.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.83.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.83.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.84.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.84.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.84.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.85.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.85.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.85.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.86.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.86.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.86.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.87.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.87.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.87.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.88.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.88.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.88.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.89.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.89.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.89.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.9.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.9.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.9.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.90.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.90.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.90.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.91.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.91.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.91.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.92.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.92.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.92.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.93.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.93.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.93.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.94.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.94.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.94.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.95.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.95.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.95.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.96.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.96.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.96.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.97.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.97.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.97.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.98.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.98.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.98.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.99.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.99.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.experts.99.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.ffn_norm.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.gate.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.shared_experts.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.shared_experts.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.20.shared_experts.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.attention.kv_a_norm.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.attention.q_a_norm.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.attention.wkv_a_with_mqa.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.attention.wkv_b.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.attention.wo.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.attention.wq_a.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.attention.wq_b.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.attention_norm.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.0.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.0.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.0.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.1.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.1.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.1.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.10.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.10.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.10.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.100.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.100.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.100.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.101.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.101.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.101.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.102.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.102.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.102.w3.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.103.w1.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.103.w2.weight": "consolidated-00052-of-00272.safetensors", + "layers.21.experts.103.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.104.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.104.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.104.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.105.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.105.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.105.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.106.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.106.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.106.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.107.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.107.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.107.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.108.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.108.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.108.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.109.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.109.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.109.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.11.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.11.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.11.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.110.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.110.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.110.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.111.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.111.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.111.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.112.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.112.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.112.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.113.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.113.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.113.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.114.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.114.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.114.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.115.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.115.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.115.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.116.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.116.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.116.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.117.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.117.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.117.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.118.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.118.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.118.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.119.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.119.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.119.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.12.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.12.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.12.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.120.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.120.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.120.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.121.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.121.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.121.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.122.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.122.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.122.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.123.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.123.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.123.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.124.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.124.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.124.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.125.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.125.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.125.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.126.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.126.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.126.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.127.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.127.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.127.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.13.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.13.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.13.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.14.w1.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.14.w2.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.14.w3.weight": "consolidated-00053-of-00272.safetensors", + "layers.21.experts.15.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.15.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.15.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.16.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.16.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.16.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.17.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.17.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.17.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.18.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.18.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.18.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.19.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.19.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.19.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.2.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.2.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.2.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.20.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.20.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.20.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.21.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.21.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.21.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.22.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.22.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.22.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.23.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.23.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.23.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.24.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.24.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.24.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.25.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.25.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.25.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.26.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.26.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.26.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.27.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.27.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.27.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.28.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.28.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.28.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.29.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.29.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.29.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.3.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.3.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.3.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.30.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.30.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.30.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.31.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.31.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.31.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.32.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.32.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.32.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.33.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.33.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.33.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.34.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.34.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.34.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.35.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.35.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.35.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.36.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.36.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.36.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.37.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.37.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.37.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.38.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.38.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.38.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.39.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.39.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.39.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.4.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.4.w2.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.4.w3.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.40.w1.weight": "consolidated-00054-of-00272.safetensors", + "layers.21.experts.40.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.40.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.41.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.41.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.41.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.42.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.42.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.42.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.43.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.43.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.43.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.44.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.44.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.44.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.45.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.45.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.45.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.46.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.46.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.46.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.47.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.47.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.47.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.48.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.48.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.48.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.49.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.49.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.49.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.5.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.5.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.5.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.50.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.50.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.50.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.51.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.51.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.51.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.52.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.52.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.52.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.53.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.53.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.53.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.54.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.54.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.54.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.55.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.55.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.55.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.56.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.56.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.56.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.57.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.57.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.57.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.58.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.58.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.58.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.59.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.59.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.59.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.6.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.6.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.6.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.60.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.60.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.60.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.61.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.61.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.61.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.62.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.62.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.62.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.63.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.63.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.63.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.64.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.64.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.64.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.65.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.65.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.65.w3.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.66.w1.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.66.w2.weight": "consolidated-00055-of-00272.safetensors", + "layers.21.experts.66.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.67.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.67.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.67.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.68.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.68.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.68.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.69.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.69.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.69.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.7.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.7.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.7.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.70.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.70.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.70.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.71.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.71.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.71.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.72.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.72.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.72.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.73.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.73.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.73.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.74.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.74.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.74.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.75.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.75.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.75.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.76.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.76.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.76.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.77.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.77.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.77.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.78.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.78.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.78.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.79.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.79.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.79.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.8.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.8.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.8.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.80.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.80.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.80.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.81.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.81.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.81.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.82.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.82.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.82.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.83.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.83.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.83.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.84.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.84.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.84.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.85.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.85.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.85.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.86.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.86.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.86.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.87.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.87.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.87.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.88.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.88.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.88.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.89.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.89.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.89.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.9.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.9.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.9.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.90.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.90.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.90.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.91.w1.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.91.w2.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.91.w3.weight": "consolidated-00056-of-00272.safetensors", + "layers.21.experts.92.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.92.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.92.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.93.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.93.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.93.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.94.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.94.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.94.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.95.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.95.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.95.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.96.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.96.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.96.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.97.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.97.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.97.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.98.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.98.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.98.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.99.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.99.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.experts.99.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.ffn_norm.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.gate.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.shared_experts.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.shared_experts.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.21.shared_experts.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.attention.kv_a_norm.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.attention.q_a_norm.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.attention.wkv_a_with_mqa.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.attention.wkv_b.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.attention.wo.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.attention.wq_a.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.attention.wq_b.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.attention_norm.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.0.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.0.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.0.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.1.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.1.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.1.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.10.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.10.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.10.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.100.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.100.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.100.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.101.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.101.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.101.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.102.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.102.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.102.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.103.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.103.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.103.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.104.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.104.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.104.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.105.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.105.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.105.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.106.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.106.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.106.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.107.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.107.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.107.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.108.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.108.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.108.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.109.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.109.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.109.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.11.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.11.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.11.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.110.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.110.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.110.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.111.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.111.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.111.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.112.w1.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.112.w2.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.112.w3.weight": "consolidated-00057-of-00272.safetensors", + "layers.22.experts.113.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.113.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.113.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.114.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.114.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.114.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.115.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.115.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.115.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.116.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.116.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.116.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.117.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.117.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.117.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.118.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.118.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.118.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.119.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.119.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.119.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.12.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.12.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.12.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.120.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.120.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.120.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.121.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.121.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.121.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.122.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.122.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.122.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.123.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.123.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.123.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.124.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.124.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.124.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.125.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.125.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.125.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.126.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.126.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.126.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.127.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.127.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.127.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.13.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.13.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.13.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.14.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.14.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.14.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.15.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.15.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.15.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.16.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.16.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.16.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.17.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.17.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.17.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.18.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.18.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.18.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.19.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.19.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.19.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.2.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.2.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.2.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.20.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.20.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.20.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.21.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.21.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.21.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.22.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.22.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.22.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.23.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.23.w2.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.23.w3.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.24.w1.weight": "consolidated-00058-of-00272.safetensors", + "layers.22.experts.24.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.24.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.25.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.25.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.25.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.26.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.26.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.26.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.27.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.27.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.27.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.28.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.28.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.28.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.29.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.29.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.29.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.3.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.3.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.3.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.30.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.30.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.30.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.31.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.31.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.31.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.32.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.32.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.32.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.33.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.33.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.33.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.34.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.34.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.34.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.35.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.35.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.35.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.36.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.36.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.36.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.37.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.37.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.37.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.38.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.38.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.38.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.39.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.39.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.39.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.4.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.4.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.4.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.40.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.40.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.40.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.41.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.41.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.41.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.42.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.42.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.42.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.43.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.43.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.43.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.44.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.44.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.44.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.45.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.45.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.45.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.46.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.46.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.46.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.47.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.47.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.47.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.48.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.48.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.48.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.49.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.49.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.49.w3.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.5.w1.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.5.w2.weight": "consolidated-00059-of-00272.safetensors", + "layers.22.experts.5.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.50.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.50.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.50.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.51.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.51.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.51.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.52.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.52.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.52.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.53.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.53.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.53.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.54.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.54.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.54.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.55.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.55.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.55.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.56.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.56.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.56.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.57.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.57.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.57.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.58.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.58.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.58.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.59.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.59.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.59.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.6.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.6.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.6.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.60.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.60.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.60.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.61.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.61.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.61.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.62.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.62.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.62.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.63.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.63.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.63.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.64.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.64.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.64.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.65.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.65.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.65.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.66.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.66.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.66.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.67.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.67.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.67.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.68.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.68.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.68.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.69.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.69.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.69.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.7.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.7.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.7.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.70.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.70.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.70.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.71.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.71.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.71.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.72.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.72.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.72.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.73.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.73.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.73.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.74.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.74.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.74.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.75.w1.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.75.w2.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.75.w3.weight": "consolidated-00060-of-00272.safetensors", + "layers.22.experts.76.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.76.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.76.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.77.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.77.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.77.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.78.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.78.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.78.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.79.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.79.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.79.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.8.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.8.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.8.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.80.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.80.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.80.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.81.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.81.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.81.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.82.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.82.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.82.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.83.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.83.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.83.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.84.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.84.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.84.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.85.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.85.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.85.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.86.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.86.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.86.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.87.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.87.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.87.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.88.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.88.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.88.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.89.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.89.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.89.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.9.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.9.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.9.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.90.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.90.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.90.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.91.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.91.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.91.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.92.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.92.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.92.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.93.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.93.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.93.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.94.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.94.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.94.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.95.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.95.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.95.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.96.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.96.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.96.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.97.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.97.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.97.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.98.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.98.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.98.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.99.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.99.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.experts.99.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.ffn_norm.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.gate.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.shared_experts.w1.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.shared_experts.w2.weight": "consolidated-00061-of-00272.safetensors", + "layers.22.shared_experts.w3.weight": "consolidated-00061-of-00272.safetensors", + "layers.23.attention.kv_a_norm.weight": "consolidated-00061-of-00272.safetensors", + "layers.23.attention.q_a_norm.weight": "consolidated-00061-of-00272.safetensors", + "layers.23.attention.wkv_a_with_mqa.weight": "consolidated-00061-of-00272.safetensors", + "layers.23.attention.wkv_b.weight": "consolidated-00061-of-00272.safetensors", + "layers.23.attention.wo.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.attention.wq_a.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.attention.wq_b.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.attention_norm.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.0.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.0.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.0.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.1.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.1.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.1.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.10.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.10.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.10.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.100.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.100.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.100.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.101.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.101.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.101.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.102.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.102.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.102.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.103.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.103.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.103.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.104.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.104.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.104.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.105.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.105.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.105.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.106.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.106.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.106.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.107.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.107.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.107.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.108.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.108.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.108.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.109.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.109.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.109.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.11.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.11.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.11.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.110.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.110.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.110.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.111.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.111.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.111.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.112.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.112.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.112.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.113.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.113.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.113.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.114.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.114.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.114.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.115.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.115.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.115.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.116.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.116.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.116.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.117.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.117.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.117.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.118.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.118.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.118.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.119.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.119.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.119.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.12.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.12.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.12.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.120.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.120.w2.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.120.w3.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.121.w1.weight": "consolidated-00062-of-00272.safetensors", + "layers.23.experts.121.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.121.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.122.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.122.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.122.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.123.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.123.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.123.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.124.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.124.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.124.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.125.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.125.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.125.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.126.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.126.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.126.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.127.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.127.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.127.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.13.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.13.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.13.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.14.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.14.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.14.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.15.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.15.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.15.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.16.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.16.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.16.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.17.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.17.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.17.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.18.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.18.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.18.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.19.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.19.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.19.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.2.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.2.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.2.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.20.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.20.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.20.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.21.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.21.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.21.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.22.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.22.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.22.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.23.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.23.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.23.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.24.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.24.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.24.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.25.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.25.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.25.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.26.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.26.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.26.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.27.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.27.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.27.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.28.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.28.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.28.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.29.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.29.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.29.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.3.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.3.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.3.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.30.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.30.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.30.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.31.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.31.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.31.w3.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.32.w1.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.32.w2.weight": "consolidated-00063-of-00272.safetensors", + "layers.23.experts.32.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.33.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.33.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.33.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.34.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.34.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.34.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.35.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.35.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.35.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.36.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.36.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.36.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.37.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.37.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.37.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.38.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.38.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.38.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.39.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.39.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.39.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.4.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.4.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.4.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.40.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.40.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.40.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.41.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.41.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.41.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.42.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.42.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.42.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.43.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.43.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.43.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.44.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.44.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.44.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.45.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.45.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.45.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.46.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.46.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.46.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.47.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.47.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.47.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.48.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.48.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.48.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.49.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.49.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.49.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.5.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.5.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.5.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.50.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.50.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.50.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.51.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.51.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.51.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.52.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.52.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.52.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.53.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.53.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.53.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.54.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.54.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.54.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.55.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.55.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.55.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.56.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.56.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.56.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.57.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.57.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.57.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.58.w1.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.58.w2.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.58.w3.weight": "consolidated-00064-of-00272.safetensors", + "layers.23.experts.59.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.59.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.59.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.6.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.6.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.6.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.60.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.60.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.60.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.61.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.61.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.61.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.62.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.62.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.62.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.63.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.63.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.63.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.64.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.64.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.64.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.65.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.65.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.65.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.66.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.66.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.66.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.67.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.67.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.67.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.68.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.68.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.68.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.69.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.69.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.69.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.7.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.7.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.7.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.70.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.70.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.70.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.71.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.71.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.71.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.72.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.72.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.72.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.73.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.73.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.73.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.74.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.74.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.74.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.75.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.75.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.75.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.76.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.76.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.76.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.77.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.77.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.77.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.78.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.78.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.78.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.79.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.79.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.79.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.8.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.8.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.8.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.80.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.80.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.80.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.81.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.81.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.81.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.82.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.82.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.82.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.83.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.83.w2.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.83.w3.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.84.w1.weight": "consolidated-00065-of-00272.safetensors", + "layers.23.experts.84.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.84.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.85.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.85.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.85.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.86.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.86.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.86.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.87.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.87.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.87.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.88.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.88.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.88.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.89.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.89.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.89.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.9.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.9.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.9.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.90.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.90.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.90.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.91.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.91.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.91.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.92.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.92.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.92.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.93.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.93.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.93.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.94.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.94.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.94.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.95.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.95.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.95.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.96.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.96.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.96.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.97.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.97.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.97.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.98.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.98.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.98.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.99.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.99.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.experts.99.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.ffn_norm.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.gate.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.shared_experts.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.shared_experts.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.23.shared_experts.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.attention.kv_a_norm.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.attention.q_a_norm.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.attention.wkv_a_with_mqa.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.attention.wkv_b.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.attention.wo.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.attention.wq_a.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.attention.wq_b.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.attention_norm.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.0.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.0.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.0.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.1.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.1.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.1.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.10.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.10.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.10.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.100.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.100.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.100.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.101.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.101.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.101.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.102.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.102.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.102.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.103.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.103.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.103.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.104.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.104.w2.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.104.w3.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.105.w1.weight": "consolidated-00066-of-00272.safetensors", + "layers.24.experts.105.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.105.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.106.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.106.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.106.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.107.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.107.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.107.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.108.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.108.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.108.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.109.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.109.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.109.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.11.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.11.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.11.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.110.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.110.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.110.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.111.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.111.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.111.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.112.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.112.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.112.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.113.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.113.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.113.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.114.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.114.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.114.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.115.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.115.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.115.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.116.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.116.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.116.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.117.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.117.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.117.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.118.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.118.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.118.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.119.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.119.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.119.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.12.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.12.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.12.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.120.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.120.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.120.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.121.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.121.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.121.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.122.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.122.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.122.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.123.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.123.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.123.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.124.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.124.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.124.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.125.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.125.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.125.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.126.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.126.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.126.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.127.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.127.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.127.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.13.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.13.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.13.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.14.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.14.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.14.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.15.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.15.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.15.w3.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.16.w1.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.16.w2.weight": "consolidated-00067-of-00272.safetensors", + "layers.24.experts.16.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.17.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.17.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.17.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.18.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.18.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.18.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.19.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.19.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.19.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.2.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.2.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.2.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.20.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.20.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.20.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.21.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.21.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.21.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.22.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.22.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.22.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.23.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.23.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.23.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.24.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.24.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.24.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.25.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.25.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.25.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.26.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.26.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.26.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.27.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.27.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.27.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.28.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.28.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.28.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.29.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.29.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.29.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.3.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.3.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.3.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.30.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.30.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.30.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.31.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.31.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.31.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.32.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.32.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.32.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.33.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.33.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.33.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.34.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.34.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.34.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.35.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.35.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.35.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.36.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.36.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.36.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.37.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.37.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.37.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.38.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.38.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.38.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.39.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.39.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.39.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.4.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.4.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.4.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.40.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.40.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.40.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.41.w1.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.41.w2.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.41.w3.weight": "consolidated-00068-of-00272.safetensors", + "layers.24.experts.42.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.42.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.42.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.43.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.43.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.43.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.44.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.44.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.44.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.45.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.45.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.45.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.46.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.46.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.46.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.47.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.47.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.47.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.48.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.48.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.48.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.49.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.49.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.49.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.5.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.5.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.5.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.50.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.50.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.50.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.51.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.51.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.51.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.52.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.52.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.52.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.53.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.53.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.53.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.54.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.54.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.54.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.55.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.55.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.55.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.56.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.56.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.56.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.57.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.57.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.57.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.58.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.58.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.58.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.59.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.59.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.59.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.6.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.6.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.6.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.60.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.60.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.60.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.61.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.61.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.61.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.62.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.62.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.62.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.63.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.63.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.63.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.64.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.64.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.64.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.65.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.65.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.65.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.66.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.66.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.66.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.67.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.67.w2.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.67.w3.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.68.w1.weight": "consolidated-00069-of-00272.safetensors", + "layers.24.experts.68.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.68.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.69.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.69.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.69.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.7.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.7.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.7.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.70.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.70.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.70.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.71.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.71.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.71.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.72.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.72.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.72.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.73.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.73.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.73.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.74.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.74.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.74.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.75.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.75.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.75.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.76.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.76.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.76.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.77.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.77.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.77.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.78.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.78.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.78.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.79.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.79.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.79.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.8.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.8.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.8.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.80.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.80.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.80.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.81.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.81.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.81.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.82.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.82.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.82.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.83.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.83.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.83.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.84.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.84.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.84.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.85.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.85.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.85.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.86.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.86.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.86.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.87.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.87.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.87.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.88.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.88.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.88.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.89.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.89.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.89.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.9.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.9.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.9.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.90.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.90.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.90.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.91.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.91.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.91.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.92.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.92.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.92.w3.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.93.w1.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.93.w2.weight": "consolidated-00070-of-00272.safetensors", + "layers.24.experts.93.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.94.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.94.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.94.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.95.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.95.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.95.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.96.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.96.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.96.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.97.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.97.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.97.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.98.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.98.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.98.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.99.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.99.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.experts.99.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.ffn_norm.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.gate.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.shared_experts.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.shared_experts.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.24.shared_experts.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.attention.kv_a_norm.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.attention.q_a_norm.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.attention.wkv_a_with_mqa.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.attention.wkv_b.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.attention.wo.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.attention.wq_a.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.attention.wq_b.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.attention_norm.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.0.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.0.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.0.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.1.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.1.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.1.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.10.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.10.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.10.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.100.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.100.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.100.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.101.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.101.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.101.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.102.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.102.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.102.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.103.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.103.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.103.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.104.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.104.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.104.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.105.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.105.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.105.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.106.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.106.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.106.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.107.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.107.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.107.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.108.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.108.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.108.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.109.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.109.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.109.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.11.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.11.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.11.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.110.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.110.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.110.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.111.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.111.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.111.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.112.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.112.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.112.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.113.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.113.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.113.w3.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.114.w1.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.114.w2.weight": "consolidated-00071-of-00272.safetensors", + "layers.25.experts.114.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.115.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.115.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.115.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.116.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.116.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.116.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.117.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.117.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.117.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.118.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.118.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.118.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.119.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.119.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.119.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.12.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.12.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.12.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.120.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.120.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.120.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.121.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.121.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.121.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.122.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.122.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.122.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.123.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.123.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.123.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.124.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.124.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.124.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.125.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.125.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.125.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.126.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.126.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.126.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.127.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.127.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.127.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.13.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.13.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.13.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.14.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.14.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.14.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.15.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.15.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.15.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.16.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.16.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.16.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.17.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.17.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.17.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.18.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.18.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.18.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.19.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.19.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.19.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.2.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.2.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.2.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.20.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.20.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.20.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.21.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.21.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.21.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.22.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.22.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.22.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.23.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.23.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.23.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.24.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.24.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.24.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.25.w1.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.25.w2.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.25.w3.weight": "consolidated-00072-of-00272.safetensors", + "layers.25.experts.26.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.26.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.26.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.27.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.27.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.27.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.28.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.28.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.28.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.29.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.29.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.29.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.3.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.3.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.3.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.30.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.30.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.30.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.31.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.31.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.31.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.32.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.32.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.32.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.33.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.33.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.33.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.34.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.34.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.34.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.35.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.35.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.35.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.36.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.36.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.36.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.37.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.37.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.37.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.38.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.38.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.38.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.39.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.39.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.39.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.4.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.4.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.4.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.40.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.40.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.40.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.41.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.41.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.41.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.42.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.42.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.42.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.43.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.43.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.43.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.44.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.44.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.44.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.45.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.45.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.45.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.46.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.46.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.46.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.47.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.47.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.47.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.48.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.48.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.48.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.49.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.49.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.49.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.5.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.5.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.5.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.50.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.50.w2.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.50.w3.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.51.w1.weight": "consolidated-00073-of-00272.safetensors", + "layers.25.experts.51.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.51.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.52.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.52.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.52.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.53.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.53.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.53.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.54.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.54.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.54.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.55.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.55.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.55.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.56.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.56.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.56.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.57.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.57.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.57.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.58.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.58.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.58.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.59.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.59.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.59.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.6.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.6.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.6.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.60.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.60.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.60.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.61.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.61.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.61.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.62.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.62.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.62.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.63.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.63.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.63.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.64.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.64.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.64.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.65.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.65.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.65.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.66.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.66.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.66.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.67.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.67.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.67.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.68.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.68.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.68.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.69.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.69.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.69.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.7.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.7.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.7.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.70.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.70.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.70.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.71.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.71.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.71.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.72.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.72.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.72.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.73.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.73.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.73.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.74.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.74.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.74.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.75.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.75.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.75.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.76.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.76.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.76.w3.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.77.w1.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.77.w2.weight": "consolidated-00074-of-00272.safetensors", + "layers.25.experts.77.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.78.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.78.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.78.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.79.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.79.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.79.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.8.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.8.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.8.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.80.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.80.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.80.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.81.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.81.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.81.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.82.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.82.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.82.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.83.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.83.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.83.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.84.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.84.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.84.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.85.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.85.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.85.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.86.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.86.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.86.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.87.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.87.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.87.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.88.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.88.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.88.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.89.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.89.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.89.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.9.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.9.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.9.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.90.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.90.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.90.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.91.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.91.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.91.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.92.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.92.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.92.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.93.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.93.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.93.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.94.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.94.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.94.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.95.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.95.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.95.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.96.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.96.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.96.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.97.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.97.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.97.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.98.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.98.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.98.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.99.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.99.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.experts.99.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.ffn_norm.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.gate.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.shared_experts.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.shared_experts.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.25.shared_experts.w3.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.attention.kv_a_norm.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.attention.q_a_norm.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.attention.wkv_a_with_mqa.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.attention.wkv_b.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.attention.wo.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.attention.wq_a.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.attention.wq_b.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.attention_norm.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.experts.0.w1.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.experts.0.w2.weight": "consolidated-00075-of-00272.safetensors", + "layers.26.experts.0.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.1.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.1.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.1.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.10.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.10.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.10.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.100.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.100.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.100.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.101.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.101.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.101.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.102.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.102.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.102.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.103.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.103.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.103.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.104.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.104.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.104.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.105.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.105.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.105.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.106.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.106.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.106.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.107.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.107.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.107.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.108.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.108.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.108.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.109.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.109.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.109.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.11.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.11.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.11.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.110.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.110.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.110.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.111.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.111.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.111.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.112.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.112.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.112.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.113.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.113.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.113.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.114.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.114.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.114.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.115.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.115.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.115.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.116.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.116.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.116.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.117.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.117.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.117.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.118.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.118.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.118.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.119.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.119.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.119.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.12.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.12.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.12.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.120.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.120.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.120.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.121.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.121.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.121.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.122.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.122.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.122.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.123.w1.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.123.w2.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.123.w3.weight": "consolidated-00076-of-00272.safetensors", + "layers.26.experts.124.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.124.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.124.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.125.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.125.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.125.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.126.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.126.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.126.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.127.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.127.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.127.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.13.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.13.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.13.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.14.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.14.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.14.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.15.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.15.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.15.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.16.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.16.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.16.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.17.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.17.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.17.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.18.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.18.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.18.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.19.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.19.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.19.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.2.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.2.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.2.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.20.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.20.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.20.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.21.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.21.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.21.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.22.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.22.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.22.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.23.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.23.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.23.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.24.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.24.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.24.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.25.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.25.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.25.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.26.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.26.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.26.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.27.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.27.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.27.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.28.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.28.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.28.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.29.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.29.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.29.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.3.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.3.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.3.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.30.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.30.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.30.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.31.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.31.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.31.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.32.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.32.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.32.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.33.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.33.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.33.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.34.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.34.w2.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.34.w3.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.35.w1.weight": "consolidated-00077-of-00272.safetensors", + "layers.26.experts.35.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.35.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.36.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.36.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.36.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.37.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.37.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.37.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.38.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.38.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.38.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.39.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.39.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.39.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.4.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.4.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.4.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.40.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.40.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.40.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.41.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.41.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.41.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.42.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.42.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.42.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.43.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.43.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.43.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.44.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.44.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.44.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.45.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.45.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.45.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.46.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.46.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.46.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.47.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.47.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.47.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.48.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.48.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.48.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.49.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.49.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.49.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.5.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.5.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.5.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.50.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.50.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.50.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.51.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.51.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.51.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.52.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.52.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.52.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.53.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.53.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.53.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.54.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.54.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.54.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.55.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.55.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.55.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.56.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.56.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.56.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.57.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.57.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.57.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.58.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.58.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.58.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.59.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.59.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.59.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.6.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.6.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.6.w3.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.60.w1.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.60.w2.weight": "consolidated-00078-of-00272.safetensors", + "layers.26.experts.60.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.61.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.61.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.61.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.62.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.62.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.62.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.63.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.63.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.63.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.64.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.64.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.64.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.65.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.65.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.65.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.66.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.66.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.66.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.67.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.67.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.67.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.68.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.68.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.68.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.69.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.69.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.69.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.7.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.7.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.7.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.70.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.70.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.70.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.71.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.71.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.71.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.72.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.72.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.72.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.73.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.73.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.73.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.74.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.74.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.74.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.75.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.75.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.75.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.76.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.76.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.76.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.77.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.77.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.77.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.78.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.78.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.78.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.79.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.79.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.79.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.8.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.8.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.8.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.80.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.80.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.80.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.81.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.81.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.81.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.82.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.82.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.82.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.83.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.83.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.83.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.84.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.84.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.84.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.85.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.85.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.85.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.86.w1.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.86.w2.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.86.w3.weight": "consolidated-00079-of-00272.safetensors", + "layers.26.experts.87.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.87.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.87.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.88.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.88.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.88.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.89.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.89.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.89.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.9.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.9.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.9.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.90.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.90.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.90.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.91.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.91.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.91.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.92.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.92.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.92.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.93.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.93.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.93.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.94.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.94.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.94.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.95.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.95.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.95.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.96.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.96.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.96.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.97.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.97.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.97.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.98.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.98.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.98.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.99.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.99.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.experts.99.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.ffn_norm.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.gate.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.shared_experts.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.shared_experts.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.26.shared_experts.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.attention.kv_a_norm.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.attention.q_a_norm.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.attention.wkv_a_with_mqa.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.attention.wkv_b.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.attention.wo.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.attention.wq_a.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.attention.wq_b.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.attention_norm.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.0.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.0.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.0.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.1.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.1.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.1.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.10.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.10.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.10.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.100.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.100.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.100.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.101.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.101.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.101.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.102.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.102.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.102.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.103.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.103.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.103.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.104.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.104.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.104.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.105.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.105.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.105.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.106.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.106.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.106.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.107.w1.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.107.w2.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.107.w3.weight": "consolidated-00080-of-00272.safetensors", + "layers.27.experts.108.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.108.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.108.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.109.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.109.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.109.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.11.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.11.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.11.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.110.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.110.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.110.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.111.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.111.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.111.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.112.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.112.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.112.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.113.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.113.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.113.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.114.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.114.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.114.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.115.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.115.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.115.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.116.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.116.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.116.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.117.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.117.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.117.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.118.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.118.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.118.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.119.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.119.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.119.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.12.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.12.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.12.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.120.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.120.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.120.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.121.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.121.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.121.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.122.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.122.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.122.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.123.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.123.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.123.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.124.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.124.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.124.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.125.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.125.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.125.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.126.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.126.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.126.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.127.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.127.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.127.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.13.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.13.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.13.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.14.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.14.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.14.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.15.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.15.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.15.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.16.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.16.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.16.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.17.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.17.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.17.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.18.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.18.w2.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.18.w3.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.19.w1.weight": "consolidated-00081-of-00272.safetensors", + "layers.27.experts.19.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.19.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.2.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.2.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.2.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.20.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.20.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.20.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.21.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.21.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.21.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.22.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.22.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.22.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.23.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.23.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.23.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.24.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.24.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.24.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.25.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.25.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.25.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.26.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.26.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.26.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.27.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.27.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.27.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.28.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.28.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.28.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.29.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.29.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.29.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.3.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.3.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.3.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.30.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.30.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.30.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.31.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.31.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.31.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.32.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.32.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.32.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.33.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.33.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.33.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.34.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.34.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.34.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.35.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.35.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.35.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.36.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.36.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.36.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.37.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.37.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.37.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.38.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.38.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.38.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.39.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.39.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.39.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.4.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.4.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.4.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.40.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.40.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.40.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.41.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.41.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.41.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.42.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.42.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.42.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.43.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.43.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.43.w3.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.44.w1.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.44.w2.weight": "consolidated-00082-of-00272.safetensors", + "layers.27.experts.44.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.45.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.45.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.45.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.46.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.46.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.46.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.47.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.47.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.47.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.48.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.48.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.48.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.49.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.49.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.49.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.5.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.5.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.5.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.50.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.50.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.50.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.51.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.51.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.51.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.52.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.52.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.52.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.53.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.53.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.53.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.54.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.54.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.54.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.55.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.55.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.55.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.56.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.56.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.56.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.57.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.57.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.57.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.58.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.58.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.58.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.59.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.59.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.59.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.6.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.6.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.6.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.60.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.60.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.60.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.61.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.61.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.61.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.62.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.62.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.62.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.63.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.63.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.63.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.64.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.64.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.64.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.65.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.65.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.65.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.66.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.66.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.66.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.67.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.67.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.67.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.68.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.68.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.68.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.69.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.69.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.69.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.7.w1.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.7.w2.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.7.w3.weight": "consolidated-00083-of-00272.safetensors", + "layers.27.experts.70.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.70.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.70.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.71.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.71.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.71.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.72.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.72.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.72.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.73.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.73.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.73.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.74.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.74.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.74.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.75.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.75.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.75.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.76.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.76.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.76.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.77.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.77.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.77.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.78.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.78.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.78.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.79.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.79.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.79.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.8.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.8.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.8.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.80.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.80.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.80.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.81.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.81.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.81.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.82.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.82.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.82.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.83.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.83.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.83.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.84.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.84.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.84.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.85.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.85.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.85.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.86.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.86.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.86.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.87.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.87.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.87.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.88.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.88.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.88.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.89.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.89.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.89.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.9.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.9.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.9.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.90.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.90.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.90.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.91.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.91.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.91.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.92.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.92.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.92.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.93.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.93.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.93.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.94.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.94.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.94.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.95.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.95.w2.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.95.w3.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.96.w1.weight": "consolidated-00084-of-00272.safetensors", + "layers.27.experts.96.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.96.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.97.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.97.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.97.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.98.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.98.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.98.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.99.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.99.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.experts.99.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.ffn_norm.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.gate.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.shared_experts.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.shared_experts.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.27.shared_experts.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.attention.kv_a_norm.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.attention.q_a_norm.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.attention.wkv_a_with_mqa.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.attention.wkv_b.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.attention.wo.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.attention.wq_a.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.attention.wq_b.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.attention_norm.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.0.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.0.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.0.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.1.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.1.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.1.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.10.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.10.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.10.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.100.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.100.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.100.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.101.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.101.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.101.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.102.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.102.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.102.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.103.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.103.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.103.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.104.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.104.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.104.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.105.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.105.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.105.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.106.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.106.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.106.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.107.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.107.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.107.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.108.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.108.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.108.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.109.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.109.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.109.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.11.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.11.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.11.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.110.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.110.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.110.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.111.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.111.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.111.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.112.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.112.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.112.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.113.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.113.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.113.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.114.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.114.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.114.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.115.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.115.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.115.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.116.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.116.w2.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.116.w3.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.117.w1.weight": "consolidated-00085-of-00272.safetensors", + "layers.28.experts.117.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.117.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.118.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.118.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.118.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.119.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.119.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.119.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.12.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.12.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.12.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.120.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.120.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.120.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.121.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.121.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.121.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.122.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.122.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.122.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.123.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.123.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.123.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.124.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.124.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.124.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.125.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.125.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.125.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.126.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.126.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.126.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.127.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.127.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.127.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.13.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.13.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.13.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.14.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.14.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.14.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.15.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.15.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.15.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.16.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.16.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.16.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.17.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.17.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.17.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.18.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.18.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.18.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.19.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.19.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.19.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.2.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.2.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.2.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.20.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.20.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.20.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.21.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.21.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.21.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.22.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.22.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.22.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.23.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.23.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.23.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.24.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.24.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.24.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.25.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.25.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.25.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.26.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.26.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.26.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.27.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.27.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.27.w3.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.28.w1.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.28.w2.weight": "consolidated-00086-of-00272.safetensors", + "layers.28.experts.28.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.29.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.29.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.29.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.3.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.3.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.3.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.30.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.30.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.30.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.31.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.31.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.31.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.32.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.32.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.32.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.33.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.33.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.33.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.34.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.34.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.34.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.35.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.35.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.35.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.36.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.36.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.36.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.37.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.37.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.37.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.38.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.38.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.38.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.39.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.39.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.39.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.4.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.4.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.4.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.40.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.40.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.40.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.41.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.41.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.41.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.42.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.42.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.42.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.43.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.43.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.43.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.44.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.44.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.44.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.45.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.45.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.45.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.46.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.46.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.46.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.47.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.47.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.47.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.48.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.48.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.48.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.49.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.49.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.49.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.5.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.5.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.5.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.50.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.50.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.50.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.51.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.51.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.51.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.52.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.52.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.52.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.53.w1.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.53.w2.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.53.w3.weight": "consolidated-00087-of-00272.safetensors", + "layers.28.experts.54.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.54.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.54.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.55.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.55.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.55.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.56.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.56.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.56.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.57.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.57.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.57.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.58.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.58.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.58.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.59.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.59.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.59.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.6.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.6.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.6.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.60.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.60.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.60.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.61.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.61.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.61.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.62.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.62.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.62.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.63.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.63.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.63.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.64.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.64.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.64.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.65.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.65.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.65.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.66.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.66.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.66.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.67.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.67.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.67.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.68.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.68.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.68.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.69.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.69.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.69.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.7.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.7.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.7.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.70.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.70.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.70.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.71.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.71.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.71.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.72.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.72.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.72.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.73.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.73.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.73.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.74.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.74.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.74.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.75.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.75.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.75.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.76.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.76.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.76.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.77.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.77.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.77.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.78.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.78.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.78.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.79.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.79.w2.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.79.w3.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.8.w1.weight": "consolidated-00088-of-00272.safetensors", + "layers.28.experts.8.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.8.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.80.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.80.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.80.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.81.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.81.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.81.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.82.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.82.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.82.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.83.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.83.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.83.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.84.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.84.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.84.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.85.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.85.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.85.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.86.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.86.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.86.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.87.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.87.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.87.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.88.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.88.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.88.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.89.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.89.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.89.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.9.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.9.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.9.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.90.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.90.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.90.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.91.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.91.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.91.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.92.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.92.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.92.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.93.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.93.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.93.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.94.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.94.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.94.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.95.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.95.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.95.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.96.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.96.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.96.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.97.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.97.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.97.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.98.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.98.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.98.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.99.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.99.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.experts.99.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.ffn_norm.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.gate.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.shared_experts.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.shared_experts.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.28.shared_experts.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.attention.kv_a_norm.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.attention.q_a_norm.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.attention.wkv_a_with_mqa.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.attention.wkv_b.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.attention.wo.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.attention.wq_a.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.attention.wq_b.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.attention_norm.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.0.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.0.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.0.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.1.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.1.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.1.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.10.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.10.w2.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.10.w3.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.100.w1.weight": "consolidated-00089-of-00272.safetensors", + "layers.29.experts.100.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.100.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.101.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.101.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.101.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.102.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.102.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.102.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.103.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.103.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.103.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.104.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.104.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.104.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.105.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.105.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.105.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.106.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.106.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.106.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.107.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.107.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.107.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.108.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.108.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.108.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.109.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.109.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.109.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.11.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.11.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.11.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.110.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.110.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.110.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.111.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.111.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.111.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.112.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.112.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.112.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.113.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.113.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.113.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.114.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.114.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.114.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.115.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.115.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.115.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.116.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.116.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.116.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.117.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.117.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.117.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.118.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.118.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.118.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.119.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.119.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.119.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.12.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.12.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.12.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.120.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.120.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.120.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.121.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.121.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.121.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.122.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.122.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.122.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.123.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.123.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.123.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.124.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.124.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.124.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.125.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.125.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.125.w3.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.126.w1.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.126.w2.weight": "consolidated-00090-of-00272.safetensors", + "layers.29.experts.126.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.127.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.127.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.127.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.13.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.13.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.13.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.14.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.14.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.14.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.15.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.15.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.15.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.16.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.16.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.16.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.17.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.17.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.17.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.18.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.18.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.18.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.19.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.19.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.19.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.2.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.2.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.2.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.20.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.20.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.20.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.21.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.21.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.21.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.22.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.22.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.22.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.23.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.23.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.23.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.24.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.24.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.24.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.25.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.25.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.25.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.26.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.26.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.26.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.27.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.27.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.27.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.28.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.28.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.28.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.29.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.29.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.29.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.3.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.3.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.3.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.30.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.30.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.30.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.31.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.31.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.31.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.32.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.32.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.32.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.33.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.33.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.33.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.34.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.34.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.34.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.35.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.35.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.35.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.36.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.36.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.36.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.37.w1.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.37.w2.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.37.w3.weight": "consolidated-00091-of-00272.safetensors", + "layers.29.experts.38.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.38.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.38.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.39.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.39.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.39.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.4.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.4.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.4.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.40.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.40.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.40.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.41.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.41.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.41.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.42.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.42.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.42.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.43.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.43.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.43.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.44.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.44.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.44.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.45.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.45.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.45.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.46.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.46.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.46.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.47.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.47.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.47.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.48.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.48.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.48.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.49.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.49.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.49.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.5.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.5.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.5.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.50.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.50.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.50.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.51.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.51.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.51.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.52.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.52.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.52.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.53.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.53.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.53.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.54.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.54.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.54.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.55.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.55.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.55.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.56.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.56.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.56.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.57.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.57.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.57.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.58.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.58.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.58.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.59.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.59.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.59.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.6.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.6.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.6.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.60.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.60.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.60.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.61.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.61.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.61.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.62.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.62.w2.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.62.w3.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.63.w1.weight": "consolidated-00092-of-00272.safetensors", + "layers.29.experts.63.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.63.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.64.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.64.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.64.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.65.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.65.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.65.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.66.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.66.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.66.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.67.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.67.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.67.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.68.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.68.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.68.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.69.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.69.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.69.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.7.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.7.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.7.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.70.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.70.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.70.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.71.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.71.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.71.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.72.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.72.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.72.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.73.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.73.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.73.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.74.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.74.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.74.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.75.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.75.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.75.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.76.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.76.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.76.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.77.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.77.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.77.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.78.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.78.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.78.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.79.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.79.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.79.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.8.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.8.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.8.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.80.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.80.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.80.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.81.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.81.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.81.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.82.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.82.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.82.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.83.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.83.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.83.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.84.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.84.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.84.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.85.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.85.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.85.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.86.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.86.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.86.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.87.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.87.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.87.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.88.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.88.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.88.w3.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.89.w1.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.89.w2.weight": "consolidated-00093-of-00272.safetensors", + "layers.29.experts.89.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.9.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.9.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.9.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.90.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.90.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.90.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.91.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.91.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.91.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.92.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.92.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.92.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.93.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.93.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.93.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.94.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.94.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.94.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.95.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.95.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.95.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.96.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.96.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.96.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.97.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.97.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.97.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.98.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.98.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.98.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.99.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.99.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.experts.99.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.ffn_norm.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.gate.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.shared_experts.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.shared_experts.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.29.shared_experts.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.attention.kv_a_norm.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.attention.q_a_norm.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.attention.wkv_a_with_mqa.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.attention.wkv_b.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.attention.wo.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.attention.wq_a.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.attention.wq_b.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.attention_norm.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.0.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.0.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.0.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.1.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.1.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.1.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.10.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.10.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.10.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.100.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.100.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.100.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.101.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.101.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.101.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.102.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.102.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.102.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.103.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.103.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.103.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.104.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.104.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.104.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.105.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.105.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.105.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.106.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.106.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.106.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.107.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.107.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.107.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.108.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.108.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.108.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.109.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.109.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.109.w3.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.11.w1.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.11.w2.weight": "consolidated-00094-of-00272.safetensors", + "layers.3.experts.11.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.110.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.110.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.110.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.111.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.111.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.111.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.112.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.112.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.112.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.113.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.113.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.113.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.114.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.114.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.114.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.115.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.115.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.115.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.116.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.116.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.116.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.117.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.117.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.117.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.118.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.118.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.118.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.119.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.119.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.119.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.12.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.12.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.12.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.120.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.120.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.120.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.121.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.121.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.121.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.122.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.122.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.122.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.123.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.123.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.123.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.124.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.124.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.124.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.125.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.125.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.125.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.126.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.126.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.126.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.127.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.127.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.127.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.13.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.13.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.13.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.14.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.14.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.14.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.15.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.15.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.15.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.16.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.16.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.16.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.17.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.17.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.17.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.18.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.18.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.18.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.19.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.19.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.19.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.2.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.2.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.2.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.20.w1.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.20.w2.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.20.w3.weight": "consolidated-00095-of-00272.safetensors", + "layers.3.experts.21.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.21.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.21.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.22.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.22.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.22.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.23.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.23.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.23.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.24.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.24.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.24.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.25.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.25.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.25.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.26.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.26.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.26.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.27.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.27.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.27.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.28.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.28.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.28.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.29.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.29.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.29.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.3.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.3.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.3.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.30.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.30.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.30.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.31.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.31.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.31.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.32.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.32.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.32.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.33.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.33.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.33.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.34.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.34.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.34.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.35.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.35.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.35.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.36.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.36.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.36.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.37.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.37.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.37.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.38.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.38.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.38.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.39.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.39.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.39.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.4.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.4.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.4.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.40.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.40.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.40.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.41.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.41.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.41.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.42.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.42.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.42.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.43.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.43.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.43.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.44.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.44.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.44.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.45.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.45.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.45.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.46.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.46.w2.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.46.w3.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.47.w1.weight": "consolidated-00096-of-00272.safetensors", + "layers.3.experts.47.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.47.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.48.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.48.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.48.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.49.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.49.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.49.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.5.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.5.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.5.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.50.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.50.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.50.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.51.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.51.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.51.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.52.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.52.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.52.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.53.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.53.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.53.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.54.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.54.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.54.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.55.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.55.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.55.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.56.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.56.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.56.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.57.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.57.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.57.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.58.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.58.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.58.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.59.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.59.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.59.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.6.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.6.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.6.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.60.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.60.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.60.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.61.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.61.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.61.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.62.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.62.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.62.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.63.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.63.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.63.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.64.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.64.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.64.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.65.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.65.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.65.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.66.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.66.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.66.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.67.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.67.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.67.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.68.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.68.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.68.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.69.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.69.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.69.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.7.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.7.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.7.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.70.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.70.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.70.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.71.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.71.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.71.w3.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.72.w1.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.72.w2.weight": "consolidated-00097-of-00272.safetensors", + "layers.3.experts.72.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.73.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.73.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.73.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.74.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.74.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.74.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.75.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.75.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.75.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.76.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.76.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.76.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.77.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.77.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.77.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.78.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.78.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.78.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.79.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.79.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.79.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.8.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.8.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.8.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.80.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.80.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.80.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.81.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.81.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.81.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.82.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.82.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.82.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.83.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.83.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.83.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.84.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.84.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.84.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.85.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.85.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.85.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.86.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.86.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.86.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.87.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.87.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.87.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.88.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.88.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.88.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.89.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.89.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.89.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.9.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.9.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.9.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.90.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.90.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.90.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.91.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.91.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.91.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.92.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.92.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.92.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.93.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.93.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.93.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.94.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.94.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.94.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.95.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.95.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.95.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.96.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.96.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.96.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.97.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.97.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.97.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.98.w1.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.98.w2.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.98.w3.weight": "consolidated-00098-of-00272.safetensors", + "layers.3.experts.99.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.3.experts.99.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.3.experts.99.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.3.ffn_norm.weight": "consolidated-00099-of-00272.safetensors", + "layers.3.gate.weight": "consolidated-00099-of-00272.safetensors", + "layers.3.shared_experts.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.3.shared_experts.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.3.shared_experts.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.attention.kv_a_norm.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.attention.q_a_norm.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.attention.wkv_a_with_mqa.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.attention.wkv_b.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.attention.wo.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.attention.wq_a.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.attention.wq_b.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.attention_norm.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.0.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.0.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.0.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.1.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.1.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.1.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.10.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.10.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.10.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.100.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.100.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.100.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.101.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.101.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.101.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.102.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.102.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.102.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.103.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.103.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.103.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.104.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.104.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.104.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.105.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.105.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.105.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.106.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.106.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.106.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.107.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.107.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.107.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.108.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.108.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.108.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.109.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.109.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.109.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.11.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.11.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.11.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.110.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.110.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.110.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.111.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.111.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.111.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.112.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.112.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.112.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.113.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.113.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.113.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.114.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.114.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.114.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.115.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.115.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.115.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.116.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.116.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.116.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.117.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.117.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.117.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.118.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.118.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.118.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.119.w1.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.119.w2.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.119.w3.weight": "consolidated-00099-of-00272.safetensors", + "layers.30.experts.12.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.12.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.12.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.120.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.120.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.120.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.121.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.121.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.121.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.122.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.122.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.122.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.123.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.123.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.123.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.124.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.124.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.124.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.125.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.125.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.125.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.126.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.126.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.126.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.127.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.127.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.127.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.13.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.13.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.13.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.14.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.14.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.14.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.15.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.15.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.15.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.16.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.16.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.16.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.17.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.17.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.17.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.18.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.18.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.18.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.19.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.19.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.19.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.2.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.2.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.2.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.20.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.20.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.20.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.21.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.21.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.21.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.22.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.22.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.22.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.23.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.23.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.23.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.24.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.24.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.24.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.25.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.25.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.25.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.26.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.26.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.26.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.27.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.27.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.27.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.28.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.28.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.28.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.29.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.29.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.29.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.3.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.3.w2.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.3.w3.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.30.w1.weight": "consolidated-00100-of-00272.safetensors", + "layers.30.experts.30.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.30.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.31.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.31.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.31.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.32.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.32.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.32.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.33.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.33.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.33.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.34.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.34.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.34.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.35.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.35.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.35.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.36.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.36.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.36.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.37.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.37.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.37.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.38.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.38.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.38.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.39.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.39.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.39.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.4.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.4.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.4.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.40.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.40.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.40.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.41.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.41.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.41.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.42.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.42.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.42.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.43.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.43.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.43.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.44.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.44.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.44.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.45.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.45.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.45.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.46.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.46.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.46.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.47.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.47.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.47.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.48.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.48.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.48.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.49.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.49.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.49.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.5.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.5.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.5.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.50.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.50.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.50.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.51.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.51.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.51.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.52.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.52.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.52.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.53.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.53.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.53.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.54.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.54.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.54.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.55.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.55.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.55.w3.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.56.w1.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.56.w2.weight": "consolidated-00101-of-00272.safetensors", + "layers.30.experts.56.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.57.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.57.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.57.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.58.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.58.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.58.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.59.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.59.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.59.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.6.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.6.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.6.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.60.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.60.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.60.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.61.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.61.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.61.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.62.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.62.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.62.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.63.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.63.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.63.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.64.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.64.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.64.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.65.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.65.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.65.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.66.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.66.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.66.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.67.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.67.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.67.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.68.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.68.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.68.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.69.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.69.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.69.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.7.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.7.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.7.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.70.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.70.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.70.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.71.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.71.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.71.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.72.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.72.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.72.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.73.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.73.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.73.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.74.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.74.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.74.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.75.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.75.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.75.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.76.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.76.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.76.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.77.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.77.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.77.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.78.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.78.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.78.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.79.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.79.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.79.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.8.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.8.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.8.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.80.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.80.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.80.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.81.w1.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.81.w2.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.81.w3.weight": "consolidated-00102-of-00272.safetensors", + "layers.30.experts.82.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.82.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.82.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.83.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.83.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.83.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.84.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.84.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.84.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.85.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.85.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.85.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.86.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.86.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.86.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.87.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.87.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.87.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.88.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.88.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.88.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.89.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.89.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.89.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.9.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.9.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.9.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.90.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.90.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.90.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.91.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.91.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.91.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.92.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.92.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.92.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.93.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.93.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.93.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.94.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.94.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.94.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.95.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.95.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.95.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.96.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.96.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.96.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.97.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.97.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.97.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.98.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.98.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.98.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.99.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.99.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.experts.99.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.ffn_norm.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.gate.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.shared_experts.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.shared_experts.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.30.shared_experts.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.attention.kv_a_norm.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.attention.q_a_norm.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.attention.wkv_a_with_mqa.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.attention.wkv_b.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.attention.wo.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.attention.wq_a.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.attention.wq_b.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.attention_norm.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.0.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.0.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.0.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.1.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.1.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.1.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.10.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.10.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.10.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.100.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.100.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.100.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.101.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.101.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.101.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.102.w1.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.102.w2.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.102.w3.weight": "consolidated-00103-of-00272.safetensors", + "layers.31.experts.103.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.103.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.103.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.104.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.104.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.104.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.105.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.105.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.105.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.106.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.106.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.106.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.107.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.107.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.107.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.108.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.108.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.108.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.109.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.109.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.109.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.11.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.11.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.11.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.110.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.110.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.110.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.111.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.111.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.111.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.112.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.112.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.112.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.113.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.113.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.113.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.114.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.114.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.114.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.115.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.115.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.115.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.116.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.116.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.116.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.117.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.117.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.117.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.118.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.118.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.118.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.119.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.119.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.119.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.12.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.12.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.12.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.120.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.120.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.120.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.121.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.121.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.121.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.122.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.122.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.122.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.123.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.123.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.123.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.124.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.124.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.124.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.125.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.125.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.125.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.126.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.126.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.126.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.127.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.127.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.127.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.13.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.13.w2.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.13.w3.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.14.w1.weight": "consolidated-00104-of-00272.safetensors", + "layers.31.experts.14.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.14.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.15.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.15.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.15.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.16.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.16.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.16.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.17.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.17.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.17.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.18.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.18.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.18.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.19.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.19.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.19.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.2.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.2.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.2.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.20.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.20.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.20.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.21.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.21.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.21.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.22.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.22.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.22.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.23.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.23.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.23.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.24.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.24.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.24.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.25.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.25.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.25.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.26.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.26.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.26.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.27.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.27.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.27.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.28.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.28.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.28.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.29.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.29.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.29.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.3.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.3.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.3.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.30.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.30.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.30.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.31.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.31.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.31.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.32.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.32.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.32.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.33.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.33.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.33.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.34.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.34.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.34.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.35.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.35.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.35.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.36.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.36.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.36.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.37.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.37.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.37.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.38.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.38.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.38.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.39.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.39.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.39.w3.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.4.w1.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.4.w2.weight": "consolidated-00105-of-00272.safetensors", + "layers.31.experts.4.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.40.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.40.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.40.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.41.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.41.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.41.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.42.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.42.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.42.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.43.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.43.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.43.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.44.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.44.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.44.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.45.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.45.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.45.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.46.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.46.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.46.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.47.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.47.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.47.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.48.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.48.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.48.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.49.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.49.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.49.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.5.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.5.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.5.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.50.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.50.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.50.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.51.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.51.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.51.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.52.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.52.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.52.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.53.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.53.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.53.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.54.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.54.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.54.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.55.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.55.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.55.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.56.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.56.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.56.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.57.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.57.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.57.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.58.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.58.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.58.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.59.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.59.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.59.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.6.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.6.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.6.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.60.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.60.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.60.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.61.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.61.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.61.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.62.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.62.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.62.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.63.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.63.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.63.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.64.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.64.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.64.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.65.w1.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.65.w2.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.65.w3.weight": "consolidated-00106-of-00272.safetensors", + "layers.31.experts.66.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.66.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.66.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.67.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.67.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.67.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.68.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.68.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.68.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.69.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.69.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.69.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.7.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.7.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.7.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.70.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.70.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.70.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.71.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.71.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.71.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.72.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.72.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.72.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.73.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.73.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.73.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.74.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.74.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.74.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.75.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.75.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.75.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.76.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.76.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.76.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.77.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.77.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.77.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.78.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.78.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.78.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.79.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.79.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.79.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.8.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.8.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.8.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.80.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.80.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.80.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.81.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.81.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.81.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.82.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.82.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.82.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.83.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.83.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.83.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.84.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.84.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.84.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.85.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.85.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.85.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.86.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.86.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.86.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.87.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.87.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.87.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.88.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.88.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.88.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.89.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.89.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.89.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.9.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.9.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.9.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.90.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.90.w2.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.90.w3.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.91.w1.weight": "consolidated-00107-of-00272.safetensors", + "layers.31.experts.91.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.91.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.92.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.92.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.92.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.93.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.93.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.93.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.94.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.94.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.94.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.95.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.95.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.95.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.96.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.96.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.96.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.97.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.97.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.97.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.98.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.98.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.98.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.99.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.99.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.experts.99.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.ffn_norm.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.gate.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.shared_experts.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.shared_experts.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.31.shared_experts.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.attention.kv_a_norm.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.attention.q_a_norm.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.attention.wkv_a_with_mqa.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.attention.wkv_b.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.attention.wo.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.attention.wq_a.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.attention.wq_b.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.attention_norm.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.0.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.0.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.0.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.1.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.1.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.1.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.10.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.10.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.10.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.100.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.100.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.100.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.101.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.101.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.101.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.102.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.102.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.102.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.103.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.103.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.103.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.104.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.104.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.104.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.105.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.105.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.105.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.106.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.106.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.106.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.107.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.107.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.107.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.108.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.108.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.108.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.109.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.109.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.109.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.11.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.11.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.11.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.110.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.110.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.110.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.111.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.111.w2.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.111.w3.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.112.w1.weight": "consolidated-00108-of-00272.safetensors", + "layers.32.experts.112.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.112.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.113.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.113.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.113.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.114.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.114.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.114.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.115.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.115.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.115.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.116.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.116.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.116.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.117.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.117.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.117.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.118.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.118.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.118.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.119.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.119.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.119.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.12.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.12.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.12.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.120.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.120.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.120.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.121.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.121.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.121.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.122.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.122.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.122.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.123.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.123.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.123.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.124.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.124.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.124.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.125.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.125.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.125.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.126.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.126.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.126.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.127.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.127.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.127.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.13.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.13.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.13.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.14.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.14.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.14.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.15.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.15.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.15.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.16.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.16.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.16.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.17.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.17.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.17.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.18.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.18.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.18.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.19.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.19.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.19.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.2.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.2.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.2.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.20.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.20.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.20.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.21.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.21.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.21.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.22.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.22.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.22.w3.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.23.w1.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.23.w2.weight": "consolidated-00109-of-00272.safetensors", + "layers.32.experts.23.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.24.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.24.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.24.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.25.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.25.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.25.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.26.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.26.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.26.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.27.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.27.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.27.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.28.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.28.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.28.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.29.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.29.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.29.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.3.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.3.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.3.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.30.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.30.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.30.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.31.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.31.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.31.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.32.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.32.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.32.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.33.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.33.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.33.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.34.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.34.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.34.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.35.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.35.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.35.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.36.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.36.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.36.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.37.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.37.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.37.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.38.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.38.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.38.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.39.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.39.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.39.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.4.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.4.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.4.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.40.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.40.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.40.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.41.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.41.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.41.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.42.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.42.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.42.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.43.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.43.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.43.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.44.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.44.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.44.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.45.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.45.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.45.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.46.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.46.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.46.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.47.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.47.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.47.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.48.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.48.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.48.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.49.w1.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.49.w2.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.49.w3.weight": "consolidated-00110-of-00272.safetensors", + "layers.32.experts.5.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.5.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.5.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.50.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.50.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.50.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.51.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.51.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.51.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.52.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.52.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.52.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.53.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.53.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.53.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.54.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.54.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.54.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.55.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.55.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.55.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.56.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.56.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.56.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.57.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.57.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.57.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.58.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.58.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.58.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.59.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.59.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.59.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.6.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.6.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.6.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.60.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.60.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.60.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.61.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.61.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.61.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.62.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.62.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.62.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.63.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.63.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.63.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.64.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.64.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.64.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.65.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.65.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.65.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.66.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.66.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.66.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.67.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.67.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.67.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.68.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.68.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.68.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.69.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.69.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.69.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.7.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.7.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.7.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.70.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.70.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.70.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.71.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.71.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.71.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.72.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.72.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.72.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.73.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.73.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.73.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.74.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.74.w2.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.74.w3.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.75.w1.weight": "consolidated-00111-of-00272.safetensors", + "layers.32.experts.75.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.75.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.76.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.76.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.76.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.77.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.77.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.77.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.78.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.78.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.78.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.79.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.79.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.79.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.8.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.8.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.8.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.80.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.80.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.80.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.81.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.81.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.81.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.82.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.82.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.82.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.83.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.83.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.83.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.84.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.84.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.84.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.85.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.85.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.85.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.86.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.86.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.86.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.87.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.87.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.87.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.88.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.88.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.88.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.89.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.89.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.89.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.9.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.9.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.9.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.90.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.90.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.90.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.91.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.91.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.91.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.92.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.92.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.92.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.93.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.93.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.93.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.94.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.94.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.94.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.95.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.95.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.95.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.96.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.96.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.96.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.97.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.97.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.97.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.98.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.98.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.98.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.99.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.99.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.experts.99.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.ffn_norm.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.gate.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.shared_experts.w1.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.shared_experts.w2.weight": "consolidated-00112-of-00272.safetensors", + "layers.32.shared_experts.w3.weight": "consolidated-00112-of-00272.safetensors", + "layers.33.attention.kv_a_norm.weight": "consolidated-00112-of-00272.safetensors", + "layers.33.attention.q_a_norm.weight": "consolidated-00112-of-00272.safetensors", + "layers.33.attention.wkv_a_with_mqa.weight": "consolidated-00112-of-00272.safetensors", + "layers.33.attention.wkv_b.weight": "consolidated-00112-of-00272.safetensors", + "layers.33.attention.wo.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.attention.wq_a.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.attention.wq_b.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.attention_norm.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.0.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.0.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.0.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.1.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.1.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.1.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.10.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.10.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.10.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.100.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.100.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.100.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.101.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.101.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.101.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.102.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.102.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.102.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.103.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.103.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.103.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.104.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.104.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.104.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.105.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.105.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.105.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.106.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.106.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.106.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.107.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.107.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.107.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.108.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.108.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.108.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.109.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.109.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.109.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.11.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.11.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.11.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.110.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.110.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.110.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.111.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.111.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.111.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.112.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.112.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.112.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.113.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.113.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.113.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.114.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.114.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.114.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.115.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.115.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.115.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.116.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.116.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.116.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.117.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.117.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.117.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.118.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.118.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.118.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.119.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.119.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.119.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.12.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.12.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.12.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.120.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.120.w2.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.120.w3.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.121.w1.weight": "consolidated-00113-of-00272.safetensors", + "layers.33.experts.121.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.121.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.122.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.122.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.122.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.123.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.123.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.123.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.124.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.124.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.124.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.125.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.125.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.125.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.126.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.126.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.126.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.127.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.127.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.127.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.13.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.13.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.13.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.14.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.14.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.14.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.15.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.15.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.15.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.16.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.16.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.16.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.17.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.17.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.17.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.18.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.18.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.18.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.19.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.19.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.19.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.2.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.2.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.2.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.20.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.20.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.20.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.21.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.21.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.21.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.22.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.22.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.22.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.23.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.23.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.23.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.24.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.24.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.24.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.25.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.25.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.25.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.26.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.26.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.26.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.27.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.27.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.27.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.28.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.28.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.28.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.29.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.29.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.29.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.3.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.3.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.3.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.30.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.30.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.30.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.31.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.31.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.31.w3.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.32.w1.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.32.w2.weight": "consolidated-00114-of-00272.safetensors", + "layers.33.experts.32.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.33.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.33.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.33.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.34.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.34.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.34.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.35.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.35.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.35.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.36.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.36.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.36.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.37.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.37.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.37.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.38.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.38.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.38.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.39.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.39.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.39.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.4.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.4.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.4.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.40.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.40.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.40.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.41.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.41.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.41.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.42.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.42.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.42.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.43.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.43.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.43.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.44.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.44.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.44.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.45.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.45.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.45.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.46.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.46.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.46.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.47.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.47.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.47.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.48.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.48.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.48.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.49.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.49.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.49.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.5.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.5.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.5.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.50.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.50.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.50.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.51.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.51.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.51.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.52.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.52.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.52.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.53.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.53.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.53.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.54.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.54.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.54.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.55.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.55.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.55.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.56.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.56.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.56.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.57.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.57.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.57.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.58.w1.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.58.w2.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.58.w3.weight": "consolidated-00115-of-00272.safetensors", + "layers.33.experts.59.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.59.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.59.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.6.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.6.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.6.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.60.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.60.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.60.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.61.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.61.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.61.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.62.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.62.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.62.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.63.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.63.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.63.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.64.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.64.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.64.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.65.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.65.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.65.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.66.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.66.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.66.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.67.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.67.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.67.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.68.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.68.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.68.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.69.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.69.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.69.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.7.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.7.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.7.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.70.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.70.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.70.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.71.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.71.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.71.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.72.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.72.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.72.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.73.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.73.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.73.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.74.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.74.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.74.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.75.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.75.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.75.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.76.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.76.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.76.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.77.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.77.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.77.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.78.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.78.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.78.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.79.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.79.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.79.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.8.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.8.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.8.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.80.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.80.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.80.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.81.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.81.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.81.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.82.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.82.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.82.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.83.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.83.w2.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.83.w3.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.84.w1.weight": "consolidated-00116-of-00272.safetensors", + "layers.33.experts.84.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.84.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.85.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.85.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.85.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.86.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.86.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.86.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.87.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.87.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.87.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.88.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.88.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.88.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.89.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.89.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.89.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.9.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.9.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.9.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.90.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.90.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.90.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.91.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.91.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.91.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.92.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.92.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.92.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.93.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.93.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.93.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.94.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.94.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.94.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.95.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.95.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.95.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.96.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.96.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.96.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.97.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.97.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.97.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.98.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.98.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.98.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.99.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.99.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.experts.99.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.ffn_norm.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.gate.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.shared_experts.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.shared_experts.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.33.shared_experts.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.attention.kv_a_norm.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.attention.q_a_norm.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.attention.wkv_a_with_mqa.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.attention.wkv_b.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.attention.wo.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.attention.wq_a.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.attention.wq_b.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.attention_norm.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.0.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.0.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.0.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.1.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.1.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.1.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.10.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.10.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.10.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.100.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.100.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.100.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.101.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.101.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.101.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.102.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.102.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.102.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.103.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.103.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.103.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.104.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.104.w2.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.104.w3.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.105.w1.weight": "consolidated-00117-of-00272.safetensors", + "layers.34.experts.105.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.105.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.106.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.106.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.106.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.107.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.107.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.107.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.108.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.108.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.108.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.109.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.109.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.109.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.11.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.11.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.11.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.110.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.110.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.110.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.111.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.111.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.111.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.112.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.112.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.112.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.113.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.113.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.113.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.114.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.114.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.114.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.115.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.115.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.115.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.116.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.116.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.116.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.117.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.117.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.117.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.118.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.118.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.118.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.119.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.119.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.119.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.12.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.12.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.12.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.120.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.120.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.120.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.121.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.121.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.121.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.122.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.122.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.122.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.123.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.123.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.123.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.124.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.124.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.124.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.125.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.125.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.125.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.126.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.126.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.126.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.127.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.127.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.127.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.13.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.13.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.13.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.14.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.14.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.14.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.15.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.15.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.15.w3.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.16.w1.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.16.w2.weight": "consolidated-00118-of-00272.safetensors", + "layers.34.experts.16.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.17.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.17.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.17.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.18.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.18.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.18.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.19.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.19.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.19.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.2.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.2.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.2.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.20.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.20.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.20.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.21.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.21.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.21.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.22.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.22.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.22.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.23.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.23.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.23.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.24.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.24.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.24.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.25.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.25.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.25.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.26.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.26.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.26.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.27.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.27.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.27.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.28.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.28.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.28.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.29.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.29.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.29.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.3.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.3.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.3.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.30.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.30.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.30.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.31.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.31.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.31.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.32.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.32.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.32.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.33.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.33.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.33.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.34.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.34.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.34.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.35.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.35.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.35.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.36.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.36.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.36.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.37.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.37.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.37.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.38.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.38.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.38.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.39.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.39.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.39.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.4.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.4.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.4.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.40.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.40.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.40.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.41.w1.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.41.w2.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.41.w3.weight": "consolidated-00119-of-00272.safetensors", + "layers.34.experts.42.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.42.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.42.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.43.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.43.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.43.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.44.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.44.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.44.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.45.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.45.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.45.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.46.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.46.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.46.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.47.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.47.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.47.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.48.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.48.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.48.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.49.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.49.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.49.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.5.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.5.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.5.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.50.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.50.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.50.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.51.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.51.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.51.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.52.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.52.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.52.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.53.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.53.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.53.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.54.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.54.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.54.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.55.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.55.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.55.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.56.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.56.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.56.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.57.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.57.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.57.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.58.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.58.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.58.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.59.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.59.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.59.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.6.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.6.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.6.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.60.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.60.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.60.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.61.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.61.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.61.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.62.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.62.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.62.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.63.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.63.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.63.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.64.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.64.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.64.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.65.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.65.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.65.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.66.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.66.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.66.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.67.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.67.w2.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.67.w3.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.68.w1.weight": "consolidated-00120-of-00272.safetensors", + "layers.34.experts.68.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.68.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.69.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.69.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.69.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.7.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.7.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.7.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.70.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.70.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.70.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.71.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.71.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.71.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.72.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.72.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.72.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.73.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.73.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.73.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.74.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.74.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.74.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.75.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.75.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.75.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.76.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.76.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.76.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.77.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.77.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.77.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.78.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.78.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.78.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.79.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.79.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.79.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.8.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.8.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.8.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.80.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.80.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.80.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.81.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.81.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.81.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.82.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.82.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.82.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.83.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.83.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.83.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.84.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.84.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.84.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.85.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.85.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.85.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.86.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.86.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.86.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.87.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.87.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.87.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.88.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.88.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.88.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.89.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.89.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.89.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.9.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.9.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.9.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.90.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.90.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.90.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.91.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.91.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.91.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.92.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.92.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.92.w3.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.93.w1.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.93.w2.weight": "consolidated-00121-of-00272.safetensors", + "layers.34.experts.93.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.94.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.94.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.94.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.95.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.95.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.95.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.96.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.96.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.96.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.97.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.97.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.97.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.98.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.98.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.98.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.99.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.99.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.experts.99.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.ffn_norm.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.gate.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.shared_experts.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.shared_experts.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.34.shared_experts.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.attention.kv_a_norm.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.attention.q_a_norm.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.attention.wkv_a_with_mqa.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.attention.wkv_b.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.attention.wo.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.attention.wq_a.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.attention.wq_b.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.attention_norm.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.0.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.0.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.0.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.1.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.1.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.1.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.10.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.10.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.10.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.100.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.100.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.100.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.101.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.101.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.101.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.102.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.102.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.102.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.103.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.103.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.103.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.104.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.104.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.104.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.105.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.105.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.105.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.106.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.106.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.106.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.107.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.107.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.107.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.108.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.108.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.108.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.109.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.109.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.109.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.11.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.11.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.11.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.110.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.110.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.110.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.111.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.111.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.111.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.112.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.112.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.112.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.113.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.113.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.113.w3.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.114.w1.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.114.w2.weight": "consolidated-00122-of-00272.safetensors", + "layers.35.experts.114.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.115.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.115.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.115.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.116.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.116.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.116.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.117.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.117.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.117.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.118.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.118.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.118.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.119.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.119.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.119.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.12.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.12.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.12.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.120.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.120.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.120.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.121.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.121.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.121.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.122.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.122.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.122.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.123.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.123.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.123.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.124.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.124.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.124.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.125.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.125.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.125.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.126.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.126.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.126.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.127.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.127.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.127.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.13.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.13.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.13.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.14.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.14.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.14.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.15.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.15.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.15.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.16.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.16.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.16.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.17.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.17.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.17.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.18.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.18.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.18.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.19.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.19.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.19.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.2.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.2.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.2.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.20.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.20.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.20.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.21.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.21.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.21.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.22.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.22.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.22.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.23.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.23.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.23.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.24.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.24.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.24.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.25.w1.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.25.w2.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.25.w3.weight": "consolidated-00123-of-00272.safetensors", + "layers.35.experts.26.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.26.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.26.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.27.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.27.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.27.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.28.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.28.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.28.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.29.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.29.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.29.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.3.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.3.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.3.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.30.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.30.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.30.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.31.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.31.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.31.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.32.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.32.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.32.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.33.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.33.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.33.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.34.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.34.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.34.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.35.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.35.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.35.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.36.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.36.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.36.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.37.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.37.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.37.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.38.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.38.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.38.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.39.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.39.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.39.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.4.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.4.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.4.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.40.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.40.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.40.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.41.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.41.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.41.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.42.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.42.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.42.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.43.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.43.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.43.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.44.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.44.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.44.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.45.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.45.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.45.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.46.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.46.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.46.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.47.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.47.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.47.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.48.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.48.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.48.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.49.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.49.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.49.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.5.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.5.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.5.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.50.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.50.w2.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.50.w3.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.51.w1.weight": "consolidated-00124-of-00272.safetensors", + "layers.35.experts.51.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.51.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.52.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.52.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.52.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.53.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.53.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.53.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.54.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.54.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.54.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.55.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.55.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.55.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.56.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.56.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.56.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.57.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.57.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.57.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.58.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.58.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.58.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.59.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.59.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.59.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.6.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.6.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.6.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.60.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.60.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.60.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.61.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.61.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.61.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.62.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.62.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.62.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.63.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.63.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.63.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.64.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.64.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.64.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.65.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.65.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.65.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.66.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.66.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.66.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.67.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.67.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.67.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.68.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.68.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.68.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.69.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.69.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.69.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.7.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.7.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.7.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.70.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.70.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.70.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.71.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.71.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.71.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.72.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.72.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.72.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.73.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.73.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.73.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.74.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.74.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.74.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.75.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.75.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.75.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.76.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.76.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.76.w3.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.77.w1.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.77.w2.weight": "consolidated-00125-of-00272.safetensors", + "layers.35.experts.77.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.78.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.78.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.78.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.79.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.79.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.79.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.8.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.8.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.8.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.80.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.80.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.80.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.81.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.81.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.81.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.82.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.82.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.82.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.83.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.83.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.83.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.84.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.84.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.84.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.85.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.85.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.85.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.86.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.86.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.86.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.87.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.87.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.87.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.88.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.88.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.88.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.89.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.89.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.89.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.9.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.9.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.9.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.90.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.90.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.90.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.91.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.91.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.91.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.92.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.92.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.92.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.93.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.93.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.93.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.94.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.94.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.94.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.95.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.95.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.95.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.96.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.96.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.96.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.97.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.97.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.97.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.98.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.98.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.98.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.99.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.99.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.experts.99.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.ffn_norm.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.gate.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.shared_experts.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.shared_experts.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.35.shared_experts.w3.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.attention.kv_a_norm.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.attention.q_a_norm.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.attention.wkv_a_with_mqa.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.attention.wkv_b.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.attention.wo.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.attention.wq_a.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.attention.wq_b.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.attention_norm.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.experts.0.w1.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.experts.0.w2.weight": "consolidated-00126-of-00272.safetensors", + "layers.36.experts.0.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.1.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.1.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.1.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.10.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.10.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.10.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.100.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.100.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.100.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.101.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.101.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.101.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.102.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.102.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.102.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.103.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.103.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.103.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.104.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.104.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.104.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.105.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.105.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.105.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.106.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.106.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.106.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.107.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.107.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.107.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.108.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.108.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.108.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.109.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.109.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.109.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.11.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.11.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.11.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.110.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.110.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.110.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.111.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.111.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.111.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.112.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.112.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.112.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.113.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.113.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.113.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.114.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.114.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.114.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.115.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.115.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.115.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.116.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.116.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.116.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.117.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.117.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.117.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.118.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.118.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.118.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.119.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.119.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.119.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.12.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.12.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.12.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.120.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.120.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.120.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.121.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.121.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.121.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.122.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.122.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.122.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.123.w1.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.123.w2.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.123.w3.weight": "consolidated-00127-of-00272.safetensors", + "layers.36.experts.124.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.124.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.124.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.125.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.125.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.125.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.126.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.126.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.126.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.127.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.127.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.127.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.13.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.13.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.13.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.14.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.14.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.14.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.15.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.15.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.15.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.16.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.16.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.16.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.17.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.17.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.17.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.18.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.18.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.18.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.19.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.19.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.19.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.2.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.2.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.2.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.20.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.20.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.20.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.21.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.21.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.21.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.22.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.22.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.22.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.23.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.23.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.23.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.24.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.24.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.24.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.25.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.25.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.25.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.26.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.26.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.26.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.27.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.27.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.27.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.28.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.28.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.28.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.29.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.29.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.29.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.3.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.3.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.3.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.30.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.30.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.30.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.31.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.31.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.31.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.32.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.32.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.32.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.33.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.33.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.33.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.34.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.34.w2.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.34.w3.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.35.w1.weight": "consolidated-00128-of-00272.safetensors", + "layers.36.experts.35.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.35.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.36.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.36.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.36.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.37.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.37.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.37.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.38.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.38.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.38.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.39.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.39.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.39.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.4.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.4.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.4.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.40.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.40.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.40.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.41.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.41.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.41.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.42.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.42.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.42.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.43.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.43.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.43.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.44.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.44.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.44.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.45.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.45.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.45.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.46.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.46.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.46.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.47.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.47.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.47.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.48.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.48.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.48.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.49.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.49.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.49.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.5.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.5.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.5.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.50.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.50.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.50.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.51.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.51.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.51.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.52.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.52.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.52.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.53.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.53.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.53.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.54.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.54.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.54.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.55.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.55.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.55.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.56.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.56.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.56.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.57.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.57.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.57.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.58.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.58.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.58.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.59.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.59.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.59.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.6.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.6.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.6.w3.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.60.w1.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.60.w2.weight": "consolidated-00129-of-00272.safetensors", + "layers.36.experts.60.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.61.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.61.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.61.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.62.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.62.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.62.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.63.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.63.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.63.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.64.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.64.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.64.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.65.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.65.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.65.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.66.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.66.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.66.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.67.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.67.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.67.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.68.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.68.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.68.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.69.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.69.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.69.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.7.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.7.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.7.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.70.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.70.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.70.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.71.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.71.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.71.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.72.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.72.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.72.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.73.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.73.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.73.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.74.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.74.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.74.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.75.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.75.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.75.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.76.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.76.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.76.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.77.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.77.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.77.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.78.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.78.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.78.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.79.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.79.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.79.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.8.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.8.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.8.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.80.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.80.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.80.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.81.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.81.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.81.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.82.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.82.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.82.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.83.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.83.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.83.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.84.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.84.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.84.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.85.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.85.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.85.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.86.w1.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.86.w2.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.86.w3.weight": "consolidated-00130-of-00272.safetensors", + "layers.36.experts.87.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.87.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.87.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.88.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.88.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.88.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.89.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.89.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.89.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.9.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.9.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.9.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.90.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.90.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.90.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.91.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.91.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.91.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.92.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.92.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.92.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.93.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.93.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.93.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.94.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.94.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.94.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.95.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.95.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.95.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.96.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.96.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.96.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.97.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.97.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.97.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.98.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.98.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.98.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.99.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.99.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.experts.99.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.ffn_norm.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.gate.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.shared_experts.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.shared_experts.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.36.shared_experts.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.attention.kv_a_norm.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.attention.q_a_norm.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.attention.wkv_a_with_mqa.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.attention.wkv_b.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.attention.wo.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.attention.wq_a.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.attention.wq_b.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.attention_norm.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.0.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.0.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.0.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.1.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.1.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.1.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.10.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.10.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.10.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.100.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.100.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.100.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.101.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.101.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.101.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.102.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.102.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.102.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.103.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.103.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.103.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.104.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.104.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.104.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.105.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.105.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.105.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.106.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.106.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.106.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.107.w1.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.107.w2.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.107.w3.weight": "consolidated-00131-of-00272.safetensors", + "layers.37.experts.108.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.108.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.108.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.109.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.109.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.109.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.11.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.11.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.11.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.110.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.110.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.110.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.111.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.111.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.111.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.112.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.112.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.112.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.113.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.113.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.113.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.114.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.114.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.114.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.115.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.115.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.115.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.116.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.116.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.116.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.117.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.117.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.117.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.118.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.118.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.118.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.119.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.119.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.119.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.12.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.12.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.12.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.120.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.120.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.120.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.121.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.121.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.121.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.122.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.122.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.122.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.123.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.123.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.123.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.124.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.124.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.124.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.125.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.125.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.125.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.126.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.126.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.126.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.127.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.127.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.127.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.13.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.13.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.13.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.14.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.14.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.14.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.15.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.15.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.15.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.16.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.16.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.16.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.17.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.17.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.17.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.18.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.18.w2.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.18.w3.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.19.w1.weight": "consolidated-00132-of-00272.safetensors", + "layers.37.experts.19.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.19.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.2.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.2.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.2.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.20.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.20.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.20.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.21.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.21.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.21.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.22.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.22.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.22.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.23.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.23.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.23.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.24.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.24.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.24.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.25.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.25.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.25.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.26.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.26.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.26.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.27.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.27.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.27.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.28.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.28.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.28.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.29.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.29.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.29.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.3.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.3.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.3.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.30.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.30.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.30.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.31.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.31.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.31.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.32.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.32.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.32.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.33.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.33.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.33.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.34.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.34.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.34.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.35.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.35.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.35.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.36.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.36.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.36.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.37.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.37.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.37.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.38.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.38.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.38.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.39.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.39.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.39.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.4.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.4.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.4.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.40.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.40.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.40.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.41.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.41.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.41.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.42.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.42.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.42.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.43.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.43.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.43.w3.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.44.w1.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.44.w2.weight": "consolidated-00133-of-00272.safetensors", + "layers.37.experts.44.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.45.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.45.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.45.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.46.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.46.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.46.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.47.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.47.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.47.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.48.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.48.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.48.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.49.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.49.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.49.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.5.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.5.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.5.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.50.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.50.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.50.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.51.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.51.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.51.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.52.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.52.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.52.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.53.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.53.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.53.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.54.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.54.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.54.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.55.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.55.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.55.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.56.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.56.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.56.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.57.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.57.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.57.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.58.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.58.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.58.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.59.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.59.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.59.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.6.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.6.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.6.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.60.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.60.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.60.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.61.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.61.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.61.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.62.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.62.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.62.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.63.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.63.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.63.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.64.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.64.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.64.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.65.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.65.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.65.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.66.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.66.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.66.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.67.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.67.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.67.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.68.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.68.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.68.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.69.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.69.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.69.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.7.w1.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.7.w2.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.7.w3.weight": "consolidated-00134-of-00272.safetensors", + "layers.37.experts.70.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.70.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.70.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.71.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.71.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.71.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.72.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.72.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.72.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.73.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.73.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.73.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.74.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.74.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.74.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.75.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.75.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.75.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.76.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.76.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.76.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.77.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.77.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.77.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.78.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.78.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.78.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.79.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.79.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.79.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.8.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.8.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.8.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.80.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.80.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.80.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.81.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.81.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.81.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.82.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.82.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.82.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.83.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.83.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.83.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.84.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.84.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.84.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.85.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.85.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.85.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.86.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.86.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.86.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.87.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.87.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.87.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.88.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.88.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.88.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.89.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.89.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.89.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.9.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.9.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.9.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.90.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.90.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.90.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.91.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.91.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.91.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.92.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.92.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.92.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.93.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.93.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.93.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.94.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.94.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.94.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.95.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.95.w2.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.95.w3.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.96.w1.weight": "consolidated-00135-of-00272.safetensors", + "layers.37.experts.96.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.96.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.97.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.97.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.97.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.98.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.98.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.98.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.99.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.99.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.experts.99.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.ffn_norm.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.gate.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.shared_experts.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.shared_experts.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.37.shared_experts.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.attention.kv_a_norm.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.attention.q_a_norm.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.attention.wkv_a_with_mqa.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.attention.wkv_b.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.attention.wo.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.attention.wq_a.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.attention.wq_b.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.attention_norm.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.0.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.0.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.0.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.1.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.1.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.1.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.10.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.10.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.10.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.100.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.100.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.100.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.101.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.101.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.101.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.102.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.102.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.102.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.103.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.103.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.103.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.104.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.104.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.104.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.105.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.105.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.105.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.106.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.106.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.106.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.107.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.107.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.107.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.108.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.108.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.108.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.109.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.109.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.109.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.11.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.11.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.11.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.110.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.110.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.110.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.111.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.111.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.111.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.112.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.112.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.112.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.113.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.113.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.113.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.114.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.114.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.114.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.115.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.115.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.115.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.116.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.116.w2.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.116.w3.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.117.w1.weight": "consolidated-00136-of-00272.safetensors", + "layers.38.experts.117.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.117.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.118.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.118.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.118.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.119.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.119.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.119.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.12.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.12.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.12.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.120.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.120.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.120.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.121.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.121.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.121.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.122.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.122.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.122.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.123.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.123.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.123.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.124.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.124.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.124.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.125.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.125.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.125.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.126.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.126.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.126.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.127.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.127.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.127.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.13.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.13.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.13.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.14.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.14.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.14.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.15.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.15.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.15.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.16.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.16.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.16.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.17.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.17.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.17.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.18.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.18.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.18.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.19.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.19.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.19.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.2.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.2.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.2.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.20.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.20.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.20.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.21.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.21.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.21.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.22.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.22.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.22.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.23.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.23.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.23.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.24.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.24.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.24.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.25.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.25.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.25.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.26.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.26.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.26.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.27.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.27.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.27.w3.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.28.w1.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.28.w2.weight": "consolidated-00137-of-00272.safetensors", + "layers.38.experts.28.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.29.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.29.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.29.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.3.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.3.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.3.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.30.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.30.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.30.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.31.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.31.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.31.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.32.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.32.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.32.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.33.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.33.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.33.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.34.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.34.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.34.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.35.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.35.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.35.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.36.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.36.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.36.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.37.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.37.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.37.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.38.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.38.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.38.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.39.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.39.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.39.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.4.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.4.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.4.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.40.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.40.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.40.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.41.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.41.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.41.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.42.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.42.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.42.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.43.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.43.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.43.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.44.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.44.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.44.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.45.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.45.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.45.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.46.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.46.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.46.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.47.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.47.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.47.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.48.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.48.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.48.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.49.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.49.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.49.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.5.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.5.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.5.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.50.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.50.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.50.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.51.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.51.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.51.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.52.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.52.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.52.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.53.w1.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.53.w2.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.53.w3.weight": "consolidated-00138-of-00272.safetensors", + "layers.38.experts.54.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.54.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.54.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.55.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.55.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.55.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.56.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.56.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.56.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.57.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.57.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.57.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.58.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.58.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.58.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.59.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.59.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.59.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.6.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.6.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.6.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.60.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.60.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.60.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.61.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.61.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.61.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.62.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.62.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.62.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.63.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.63.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.63.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.64.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.64.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.64.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.65.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.65.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.65.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.66.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.66.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.66.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.67.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.67.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.67.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.68.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.68.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.68.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.69.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.69.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.69.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.7.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.7.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.7.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.70.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.70.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.70.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.71.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.71.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.71.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.72.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.72.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.72.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.73.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.73.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.73.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.74.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.74.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.74.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.75.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.75.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.75.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.76.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.76.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.76.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.77.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.77.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.77.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.78.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.78.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.78.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.79.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.79.w2.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.79.w3.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.8.w1.weight": "consolidated-00139-of-00272.safetensors", + "layers.38.experts.8.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.8.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.80.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.80.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.80.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.81.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.81.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.81.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.82.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.82.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.82.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.83.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.83.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.83.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.84.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.84.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.84.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.85.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.85.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.85.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.86.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.86.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.86.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.87.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.87.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.87.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.88.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.88.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.88.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.89.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.89.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.89.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.9.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.9.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.9.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.90.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.90.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.90.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.91.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.91.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.91.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.92.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.92.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.92.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.93.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.93.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.93.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.94.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.94.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.94.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.95.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.95.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.95.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.96.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.96.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.96.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.97.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.97.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.97.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.98.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.98.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.98.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.99.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.99.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.experts.99.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.ffn_norm.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.gate.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.shared_experts.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.shared_experts.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.38.shared_experts.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.attention.kv_a_norm.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.attention.q_a_norm.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.attention.wkv_a_with_mqa.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.attention.wkv_b.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.attention.wo.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.attention.wq_a.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.attention.wq_b.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.attention_norm.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.0.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.0.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.0.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.1.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.1.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.1.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.10.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.10.w2.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.10.w3.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.100.w1.weight": "consolidated-00140-of-00272.safetensors", + "layers.39.experts.100.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.100.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.101.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.101.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.101.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.102.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.102.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.102.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.103.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.103.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.103.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.104.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.104.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.104.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.105.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.105.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.105.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.106.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.106.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.106.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.107.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.107.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.107.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.108.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.108.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.108.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.109.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.109.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.109.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.11.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.11.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.11.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.110.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.110.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.110.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.111.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.111.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.111.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.112.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.112.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.112.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.113.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.113.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.113.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.114.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.114.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.114.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.115.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.115.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.115.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.116.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.116.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.116.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.117.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.117.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.117.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.118.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.118.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.118.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.119.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.119.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.119.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.12.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.12.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.12.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.120.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.120.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.120.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.121.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.121.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.121.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.122.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.122.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.122.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.123.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.123.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.123.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.124.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.124.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.124.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.125.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.125.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.125.w3.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.126.w1.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.126.w2.weight": "consolidated-00141-of-00272.safetensors", + "layers.39.experts.126.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.127.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.127.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.127.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.13.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.13.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.13.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.14.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.14.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.14.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.15.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.15.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.15.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.16.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.16.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.16.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.17.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.17.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.17.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.18.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.18.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.18.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.19.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.19.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.19.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.2.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.2.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.2.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.20.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.20.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.20.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.21.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.21.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.21.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.22.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.22.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.22.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.23.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.23.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.23.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.24.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.24.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.24.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.25.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.25.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.25.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.26.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.26.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.26.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.27.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.27.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.27.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.28.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.28.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.28.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.29.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.29.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.29.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.3.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.3.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.3.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.30.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.30.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.30.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.31.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.31.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.31.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.32.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.32.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.32.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.33.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.33.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.33.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.34.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.34.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.34.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.35.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.35.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.35.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.36.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.36.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.36.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.37.w1.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.37.w2.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.37.w3.weight": "consolidated-00142-of-00272.safetensors", + "layers.39.experts.38.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.38.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.38.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.39.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.39.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.39.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.4.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.4.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.4.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.40.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.40.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.40.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.41.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.41.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.41.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.42.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.42.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.42.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.43.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.43.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.43.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.44.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.44.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.44.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.45.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.45.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.45.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.46.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.46.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.46.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.47.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.47.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.47.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.48.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.48.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.48.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.49.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.49.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.49.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.5.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.5.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.5.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.50.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.50.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.50.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.51.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.51.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.51.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.52.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.52.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.52.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.53.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.53.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.53.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.54.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.54.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.54.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.55.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.55.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.55.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.56.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.56.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.56.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.57.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.57.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.57.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.58.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.58.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.58.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.59.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.59.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.59.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.6.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.6.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.6.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.60.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.60.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.60.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.61.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.61.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.61.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.62.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.62.w2.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.62.w3.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.63.w1.weight": "consolidated-00143-of-00272.safetensors", + "layers.39.experts.63.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.63.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.64.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.64.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.64.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.65.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.65.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.65.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.66.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.66.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.66.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.67.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.67.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.67.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.68.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.68.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.68.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.69.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.69.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.69.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.7.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.7.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.7.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.70.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.70.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.70.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.71.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.71.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.71.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.72.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.72.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.72.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.73.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.73.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.73.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.74.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.74.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.74.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.75.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.75.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.75.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.76.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.76.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.76.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.77.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.77.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.77.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.78.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.78.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.78.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.79.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.79.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.79.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.8.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.8.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.8.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.80.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.80.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.80.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.81.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.81.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.81.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.82.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.82.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.82.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.83.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.83.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.83.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.84.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.84.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.84.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.85.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.85.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.85.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.86.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.86.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.86.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.87.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.87.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.87.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.88.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.88.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.88.w3.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.89.w1.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.89.w2.weight": "consolidated-00144-of-00272.safetensors", + "layers.39.experts.89.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.9.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.9.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.9.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.90.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.90.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.90.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.91.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.91.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.91.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.92.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.92.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.92.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.93.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.93.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.93.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.94.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.94.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.94.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.95.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.95.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.95.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.96.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.96.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.96.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.97.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.97.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.97.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.98.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.98.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.98.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.99.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.99.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.experts.99.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.ffn_norm.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.gate.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.shared_experts.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.shared_experts.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.39.shared_experts.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.attention.kv_a_norm.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.attention.q_a_norm.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.attention.wkv_a_with_mqa.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.attention.wkv_b.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.attention.wo.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.attention.wq_a.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.attention.wq_b.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.attention_norm.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.0.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.0.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.0.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.1.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.1.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.1.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.10.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.10.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.10.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.100.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.100.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.100.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.101.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.101.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.101.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.102.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.102.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.102.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.103.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.103.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.103.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.104.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.104.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.104.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.105.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.105.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.105.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.106.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.106.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.106.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.107.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.107.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.107.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.108.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.108.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.108.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.109.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.109.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.109.w3.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.11.w1.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.11.w2.weight": "consolidated-00145-of-00272.safetensors", + "layers.4.experts.11.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.110.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.110.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.110.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.111.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.111.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.111.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.112.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.112.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.112.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.113.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.113.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.113.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.114.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.114.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.114.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.115.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.115.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.115.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.116.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.116.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.116.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.117.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.117.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.117.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.118.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.118.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.118.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.119.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.119.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.119.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.12.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.12.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.12.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.120.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.120.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.120.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.121.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.121.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.121.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.122.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.122.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.122.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.123.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.123.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.123.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.124.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.124.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.124.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.125.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.125.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.125.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.126.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.126.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.126.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.127.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.127.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.127.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.13.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.13.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.13.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.14.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.14.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.14.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.15.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.15.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.15.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.16.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.16.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.16.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.17.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.17.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.17.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.18.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.18.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.18.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.19.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.19.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.19.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.2.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.2.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.2.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.20.w1.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.20.w2.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.20.w3.weight": "consolidated-00146-of-00272.safetensors", + "layers.4.experts.21.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.21.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.21.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.22.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.22.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.22.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.23.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.23.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.23.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.24.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.24.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.24.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.25.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.25.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.25.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.26.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.26.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.26.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.27.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.27.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.27.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.28.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.28.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.28.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.29.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.29.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.29.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.3.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.3.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.3.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.30.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.30.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.30.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.31.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.31.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.31.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.32.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.32.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.32.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.33.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.33.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.33.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.34.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.34.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.34.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.35.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.35.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.35.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.36.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.36.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.36.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.37.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.37.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.37.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.38.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.38.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.38.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.39.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.39.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.39.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.4.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.4.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.4.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.40.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.40.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.40.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.41.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.41.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.41.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.42.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.42.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.42.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.43.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.43.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.43.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.44.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.44.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.44.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.45.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.45.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.45.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.46.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.46.w2.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.46.w3.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.47.w1.weight": "consolidated-00147-of-00272.safetensors", + "layers.4.experts.47.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.47.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.48.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.48.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.48.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.49.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.49.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.49.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.5.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.5.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.5.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.50.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.50.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.50.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.51.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.51.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.51.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.52.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.52.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.52.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.53.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.53.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.53.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.54.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.54.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.54.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.55.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.55.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.55.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.56.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.56.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.56.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.57.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.57.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.57.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.58.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.58.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.58.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.59.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.59.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.59.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.6.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.6.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.6.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.60.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.60.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.60.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.61.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.61.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.61.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.62.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.62.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.62.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.63.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.63.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.63.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.64.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.64.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.64.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.65.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.65.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.65.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.66.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.66.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.66.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.67.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.67.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.67.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.68.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.68.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.68.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.69.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.69.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.69.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.7.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.7.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.7.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.70.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.70.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.70.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.71.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.71.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.71.w3.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.72.w1.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.72.w2.weight": "consolidated-00148-of-00272.safetensors", + "layers.4.experts.72.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.73.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.73.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.73.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.74.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.74.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.74.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.75.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.75.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.75.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.76.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.76.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.76.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.77.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.77.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.77.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.78.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.78.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.78.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.79.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.79.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.79.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.8.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.8.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.8.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.80.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.80.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.80.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.81.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.81.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.81.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.82.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.82.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.82.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.83.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.83.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.83.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.84.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.84.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.84.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.85.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.85.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.85.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.86.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.86.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.86.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.87.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.87.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.87.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.88.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.88.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.88.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.89.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.89.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.89.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.9.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.9.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.9.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.90.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.90.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.90.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.91.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.91.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.91.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.92.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.92.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.92.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.93.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.93.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.93.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.94.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.94.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.94.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.95.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.95.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.95.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.96.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.96.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.96.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.97.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.97.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.97.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.98.w1.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.98.w2.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.98.w3.weight": "consolidated-00149-of-00272.safetensors", + "layers.4.experts.99.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.4.experts.99.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.4.experts.99.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.4.ffn_norm.weight": "consolidated-00150-of-00272.safetensors", + "layers.4.gate.weight": "consolidated-00150-of-00272.safetensors", + "layers.4.shared_experts.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.4.shared_experts.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.4.shared_experts.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.attention.kv_a_norm.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.attention.q_a_norm.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.attention.wkv_a_with_mqa.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.attention.wkv_b.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.attention.wo.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.attention.wq_a.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.attention.wq_b.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.attention_norm.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.0.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.0.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.0.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.1.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.1.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.1.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.10.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.10.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.10.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.100.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.100.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.100.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.101.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.101.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.101.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.102.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.102.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.102.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.103.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.103.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.103.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.104.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.104.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.104.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.105.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.105.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.105.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.106.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.106.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.106.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.107.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.107.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.107.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.108.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.108.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.108.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.109.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.109.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.109.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.11.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.11.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.11.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.110.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.110.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.110.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.111.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.111.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.111.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.112.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.112.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.112.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.113.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.113.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.113.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.114.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.114.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.114.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.115.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.115.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.115.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.116.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.116.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.116.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.117.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.117.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.117.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.118.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.118.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.118.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.119.w1.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.119.w2.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.119.w3.weight": "consolidated-00150-of-00272.safetensors", + "layers.40.experts.12.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.12.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.12.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.120.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.120.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.120.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.121.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.121.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.121.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.122.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.122.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.122.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.123.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.123.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.123.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.124.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.124.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.124.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.125.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.125.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.125.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.126.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.126.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.126.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.127.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.127.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.127.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.13.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.13.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.13.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.14.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.14.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.14.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.15.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.15.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.15.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.16.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.16.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.16.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.17.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.17.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.17.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.18.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.18.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.18.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.19.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.19.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.19.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.2.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.2.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.2.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.20.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.20.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.20.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.21.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.21.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.21.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.22.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.22.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.22.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.23.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.23.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.23.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.24.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.24.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.24.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.25.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.25.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.25.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.26.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.26.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.26.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.27.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.27.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.27.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.28.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.28.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.28.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.29.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.29.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.29.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.3.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.3.w2.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.3.w3.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.30.w1.weight": "consolidated-00151-of-00272.safetensors", + "layers.40.experts.30.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.30.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.31.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.31.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.31.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.32.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.32.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.32.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.33.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.33.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.33.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.34.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.34.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.34.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.35.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.35.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.35.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.36.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.36.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.36.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.37.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.37.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.37.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.38.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.38.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.38.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.39.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.39.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.39.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.4.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.4.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.4.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.40.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.40.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.40.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.41.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.41.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.41.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.42.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.42.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.42.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.43.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.43.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.43.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.44.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.44.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.44.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.45.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.45.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.45.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.46.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.46.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.46.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.47.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.47.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.47.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.48.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.48.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.48.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.49.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.49.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.49.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.5.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.5.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.5.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.50.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.50.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.50.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.51.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.51.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.51.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.52.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.52.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.52.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.53.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.53.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.53.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.54.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.54.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.54.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.55.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.55.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.55.w3.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.56.w1.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.56.w2.weight": "consolidated-00152-of-00272.safetensors", + "layers.40.experts.56.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.57.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.57.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.57.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.58.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.58.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.58.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.59.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.59.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.59.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.6.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.6.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.6.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.60.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.60.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.60.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.61.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.61.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.61.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.62.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.62.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.62.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.63.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.63.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.63.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.64.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.64.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.64.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.65.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.65.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.65.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.66.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.66.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.66.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.67.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.67.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.67.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.68.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.68.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.68.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.69.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.69.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.69.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.7.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.7.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.7.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.70.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.70.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.70.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.71.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.71.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.71.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.72.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.72.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.72.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.73.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.73.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.73.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.74.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.74.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.74.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.75.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.75.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.75.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.76.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.76.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.76.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.77.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.77.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.77.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.78.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.78.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.78.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.79.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.79.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.79.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.8.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.8.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.8.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.80.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.80.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.80.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.81.w1.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.81.w2.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.81.w3.weight": "consolidated-00153-of-00272.safetensors", + "layers.40.experts.82.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.82.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.82.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.83.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.83.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.83.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.84.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.84.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.84.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.85.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.85.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.85.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.86.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.86.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.86.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.87.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.87.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.87.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.88.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.88.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.88.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.89.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.89.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.89.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.9.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.9.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.9.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.90.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.90.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.90.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.91.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.91.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.91.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.92.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.92.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.92.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.93.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.93.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.93.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.94.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.94.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.94.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.95.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.95.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.95.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.96.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.96.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.96.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.97.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.97.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.97.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.98.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.98.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.98.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.99.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.99.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.experts.99.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.ffn_norm.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.gate.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.shared_experts.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.shared_experts.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.40.shared_experts.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.attention.kv_a_norm.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.attention.q_a_norm.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.attention.wkv_a_with_mqa.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.attention.wkv_b.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.attention.wo.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.attention.wq_a.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.attention.wq_b.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.attention_norm.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.0.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.0.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.0.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.1.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.1.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.1.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.10.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.10.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.10.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.100.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.100.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.100.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.101.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.101.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.101.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.102.w1.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.102.w2.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.102.w3.weight": "consolidated-00154-of-00272.safetensors", + "layers.41.experts.103.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.103.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.103.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.104.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.104.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.104.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.105.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.105.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.105.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.106.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.106.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.106.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.107.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.107.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.107.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.108.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.108.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.108.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.109.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.109.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.109.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.11.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.11.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.11.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.110.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.110.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.110.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.111.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.111.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.111.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.112.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.112.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.112.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.113.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.113.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.113.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.114.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.114.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.114.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.115.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.115.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.115.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.116.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.116.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.116.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.117.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.117.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.117.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.118.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.118.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.118.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.119.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.119.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.119.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.12.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.12.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.12.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.120.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.120.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.120.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.121.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.121.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.121.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.122.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.122.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.122.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.123.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.123.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.123.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.124.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.124.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.124.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.125.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.125.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.125.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.126.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.126.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.126.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.127.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.127.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.127.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.13.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.13.w2.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.13.w3.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.14.w1.weight": "consolidated-00155-of-00272.safetensors", + "layers.41.experts.14.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.14.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.15.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.15.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.15.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.16.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.16.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.16.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.17.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.17.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.17.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.18.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.18.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.18.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.19.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.19.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.19.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.2.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.2.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.2.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.20.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.20.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.20.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.21.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.21.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.21.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.22.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.22.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.22.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.23.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.23.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.23.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.24.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.24.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.24.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.25.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.25.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.25.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.26.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.26.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.26.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.27.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.27.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.27.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.28.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.28.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.28.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.29.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.29.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.29.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.3.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.3.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.3.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.30.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.30.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.30.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.31.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.31.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.31.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.32.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.32.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.32.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.33.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.33.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.33.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.34.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.34.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.34.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.35.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.35.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.35.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.36.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.36.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.36.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.37.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.37.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.37.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.38.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.38.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.38.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.39.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.39.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.39.w3.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.4.w1.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.4.w2.weight": "consolidated-00156-of-00272.safetensors", + "layers.41.experts.4.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.40.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.40.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.40.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.41.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.41.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.41.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.42.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.42.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.42.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.43.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.43.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.43.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.44.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.44.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.44.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.45.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.45.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.45.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.46.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.46.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.46.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.47.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.47.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.47.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.48.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.48.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.48.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.49.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.49.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.49.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.5.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.5.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.5.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.50.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.50.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.50.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.51.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.51.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.51.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.52.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.52.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.52.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.53.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.53.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.53.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.54.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.54.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.54.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.55.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.55.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.55.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.56.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.56.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.56.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.57.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.57.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.57.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.58.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.58.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.58.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.59.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.59.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.59.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.6.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.6.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.6.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.60.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.60.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.60.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.61.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.61.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.61.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.62.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.62.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.62.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.63.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.63.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.63.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.64.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.64.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.64.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.65.w1.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.65.w2.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.65.w3.weight": "consolidated-00157-of-00272.safetensors", + "layers.41.experts.66.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.66.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.66.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.67.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.67.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.67.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.68.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.68.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.68.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.69.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.69.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.69.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.7.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.7.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.7.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.70.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.70.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.70.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.71.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.71.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.71.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.72.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.72.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.72.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.73.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.73.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.73.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.74.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.74.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.74.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.75.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.75.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.75.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.76.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.76.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.76.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.77.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.77.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.77.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.78.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.78.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.78.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.79.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.79.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.79.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.8.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.8.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.8.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.80.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.80.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.80.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.81.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.81.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.81.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.82.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.82.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.82.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.83.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.83.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.83.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.84.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.84.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.84.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.85.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.85.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.85.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.86.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.86.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.86.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.87.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.87.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.87.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.88.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.88.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.88.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.89.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.89.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.89.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.9.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.9.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.9.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.90.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.90.w2.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.90.w3.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.91.w1.weight": "consolidated-00158-of-00272.safetensors", + "layers.41.experts.91.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.91.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.92.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.92.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.92.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.93.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.93.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.93.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.94.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.94.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.94.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.95.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.95.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.95.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.96.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.96.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.96.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.97.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.97.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.97.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.98.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.98.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.98.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.99.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.99.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.experts.99.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.ffn_norm.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.gate.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.shared_experts.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.shared_experts.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.41.shared_experts.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.attention.kv_a_norm.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.attention.q_a_norm.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.attention.wkv_a_with_mqa.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.attention.wkv_b.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.attention.wo.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.attention.wq_a.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.attention.wq_b.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.attention_norm.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.0.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.0.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.0.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.1.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.1.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.1.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.10.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.10.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.10.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.100.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.100.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.100.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.101.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.101.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.101.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.102.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.102.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.102.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.103.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.103.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.103.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.104.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.104.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.104.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.105.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.105.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.105.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.106.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.106.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.106.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.107.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.107.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.107.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.108.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.108.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.108.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.109.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.109.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.109.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.11.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.11.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.11.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.110.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.110.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.110.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.111.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.111.w2.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.111.w3.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.112.w1.weight": "consolidated-00159-of-00272.safetensors", + "layers.42.experts.112.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.112.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.113.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.113.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.113.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.114.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.114.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.114.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.115.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.115.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.115.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.116.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.116.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.116.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.117.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.117.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.117.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.118.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.118.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.118.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.119.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.119.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.119.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.12.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.12.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.12.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.120.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.120.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.120.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.121.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.121.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.121.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.122.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.122.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.122.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.123.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.123.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.123.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.124.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.124.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.124.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.125.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.125.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.125.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.126.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.126.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.126.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.127.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.127.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.127.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.13.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.13.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.13.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.14.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.14.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.14.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.15.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.15.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.15.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.16.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.16.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.16.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.17.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.17.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.17.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.18.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.18.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.18.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.19.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.19.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.19.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.2.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.2.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.2.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.20.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.20.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.20.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.21.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.21.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.21.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.22.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.22.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.22.w3.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.23.w1.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.23.w2.weight": "consolidated-00160-of-00272.safetensors", + "layers.42.experts.23.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.24.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.24.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.24.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.25.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.25.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.25.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.26.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.26.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.26.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.27.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.27.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.27.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.28.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.28.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.28.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.29.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.29.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.29.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.3.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.3.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.3.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.30.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.30.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.30.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.31.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.31.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.31.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.32.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.32.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.32.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.33.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.33.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.33.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.34.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.34.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.34.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.35.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.35.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.35.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.36.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.36.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.36.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.37.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.37.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.37.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.38.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.38.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.38.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.39.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.39.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.39.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.4.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.4.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.4.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.40.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.40.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.40.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.41.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.41.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.41.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.42.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.42.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.42.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.43.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.43.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.43.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.44.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.44.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.44.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.45.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.45.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.45.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.46.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.46.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.46.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.47.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.47.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.47.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.48.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.48.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.48.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.49.w1.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.49.w2.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.49.w3.weight": "consolidated-00161-of-00272.safetensors", + "layers.42.experts.5.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.5.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.5.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.50.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.50.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.50.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.51.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.51.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.51.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.52.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.52.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.52.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.53.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.53.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.53.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.54.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.54.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.54.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.55.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.55.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.55.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.56.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.56.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.56.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.57.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.57.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.57.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.58.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.58.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.58.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.59.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.59.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.59.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.6.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.6.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.6.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.60.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.60.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.60.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.61.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.61.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.61.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.62.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.62.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.62.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.63.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.63.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.63.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.64.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.64.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.64.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.65.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.65.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.65.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.66.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.66.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.66.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.67.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.67.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.67.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.68.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.68.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.68.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.69.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.69.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.69.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.7.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.7.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.7.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.70.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.70.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.70.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.71.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.71.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.71.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.72.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.72.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.72.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.73.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.73.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.73.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.74.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.74.w2.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.74.w3.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.75.w1.weight": "consolidated-00162-of-00272.safetensors", + "layers.42.experts.75.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.75.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.76.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.76.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.76.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.77.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.77.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.77.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.78.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.78.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.78.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.79.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.79.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.79.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.8.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.8.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.8.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.80.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.80.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.80.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.81.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.81.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.81.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.82.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.82.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.82.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.83.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.83.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.83.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.84.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.84.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.84.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.85.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.85.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.85.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.86.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.86.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.86.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.87.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.87.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.87.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.88.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.88.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.88.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.89.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.89.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.89.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.9.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.9.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.9.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.90.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.90.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.90.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.91.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.91.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.91.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.92.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.92.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.92.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.93.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.93.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.93.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.94.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.94.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.94.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.95.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.95.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.95.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.96.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.96.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.96.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.97.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.97.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.97.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.98.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.98.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.98.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.99.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.99.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.experts.99.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.ffn_norm.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.gate.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.shared_experts.w1.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.shared_experts.w2.weight": "consolidated-00163-of-00272.safetensors", + "layers.42.shared_experts.w3.weight": "consolidated-00163-of-00272.safetensors", + "layers.43.attention.kv_a_norm.weight": "consolidated-00163-of-00272.safetensors", + "layers.43.attention.q_a_norm.weight": "consolidated-00163-of-00272.safetensors", + "layers.43.attention.wkv_a_with_mqa.weight": "consolidated-00163-of-00272.safetensors", + "layers.43.attention.wkv_b.weight": "consolidated-00163-of-00272.safetensors", + "layers.43.attention.wo.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.attention.wq_a.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.attention.wq_b.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.attention_norm.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.0.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.0.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.0.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.1.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.1.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.1.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.10.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.10.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.10.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.100.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.100.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.100.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.101.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.101.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.101.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.102.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.102.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.102.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.103.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.103.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.103.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.104.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.104.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.104.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.105.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.105.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.105.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.106.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.106.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.106.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.107.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.107.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.107.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.108.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.108.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.108.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.109.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.109.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.109.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.11.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.11.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.11.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.110.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.110.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.110.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.111.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.111.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.111.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.112.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.112.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.112.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.113.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.113.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.113.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.114.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.114.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.114.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.115.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.115.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.115.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.116.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.116.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.116.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.117.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.117.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.117.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.118.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.118.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.118.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.119.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.119.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.119.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.12.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.12.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.12.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.120.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.120.w2.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.120.w3.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.121.w1.weight": "consolidated-00164-of-00272.safetensors", + "layers.43.experts.121.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.121.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.122.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.122.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.122.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.123.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.123.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.123.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.124.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.124.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.124.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.125.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.125.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.125.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.126.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.126.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.126.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.127.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.127.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.127.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.13.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.13.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.13.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.14.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.14.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.14.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.15.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.15.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.15.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.16.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.16.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.16.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.17.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.17.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.17.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.18.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.18.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.18.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.19.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.19.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.19.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.2.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.2.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.2.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.20.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.20.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.20.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.21.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.21.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.21.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.22.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.22.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.22.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.23.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.23.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.23.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.24.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.24.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.24.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.25.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.25.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.25.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.26.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.26.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.26.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.27.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.27.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.27.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.28.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.28.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.28.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.29.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.29.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.29.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.3.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.3.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.3.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.30.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.30.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.30.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.31.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.31.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.31.w3.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.32.w1.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.32.w2.weight": "consolidated-00165-of-00272.safetensors", + "layers.43.experts.32.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.33.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.33.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.33.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.34.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.34.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.34.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.35.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.35.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.35.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.36.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.36.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.36.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.37.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.37.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.37.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.38.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.38.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.38.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.39.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.39.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.39.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.4.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.4.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.4.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.40.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.40.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.40.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.41.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.41.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.41.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.42.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.42.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.42.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.43.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.43.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.43.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.44.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.44.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.44.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.45.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.45.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.45.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.46.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.46.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.46.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.47.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.47.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.47.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.48.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.48.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.48.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.49.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.49.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.49.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.5.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.5.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.5.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.50.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.50.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.50.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.51.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.51.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.51.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.52.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.52.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.52.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.53.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.53.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.53.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.54.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.54.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.54.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.55.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.55.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.55.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.56.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.56.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.56.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.57.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.57.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.57.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.58.w1.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.58.w2.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.58.w3.weight": "consolidated-00166-of-00272.safetensors", + "layers.43.experts.59.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.59.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.59.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.6.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.6.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.6.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.60.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.60.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.60.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.61.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.61.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.61.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.62.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.62.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.62.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.63.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.63.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.63.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.64.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.64.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.64.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.65.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.65.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.65.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.66.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.66.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.66.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.67.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.67.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.67.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.68.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.68.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.68.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.69.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.69.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.69.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.7.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.7.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.7.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.70.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.70.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.70.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.71.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.71.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.71.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.72.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.72.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.72.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.73.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.73.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.73.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.74.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.74.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.74.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.75.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.75.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.75.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.76.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.76.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.76.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.77.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.77.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.77.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.78.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.78.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.78.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.79.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.79.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.79.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.8.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.8.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.8.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.80.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.80.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.80.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.81.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.81.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.81.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.82.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.82.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.82.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.83.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.83.w2.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.83.w3.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.84.w1.weight": "consolidated-00167-of-00272.safetensors", + "layers.43.experts.84.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.84.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.85.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.85.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.85.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.86.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.86.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.86.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.87.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.87.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.87.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.88.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.88.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.88.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.89.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.89.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.89.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.9.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.9.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.9.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.90.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.90.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.90.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.91.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.91.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.91.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.92.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.92.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.92.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.93.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.93.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.93.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.94.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.94.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.94.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.95.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.95.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.95.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.96.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.96.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.96.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.97.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.97.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.97.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.98.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.98.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.98.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.99.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.99.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.experts.99.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.ffn_norm.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.gate.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.shared_experts.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.shared_experts.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.43.shared_experts.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.attention.kv_a_norm.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.attention.q_a_norm.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.attention.wkv_a_with_mqa.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.attention.wkv_b.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.attention.wo.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.attention.wq_a.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.attention.wq_b.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.attention_norm.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.0.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.0.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.0.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.1.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.1.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.1.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.10.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.10.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.10.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.100.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.100.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.100.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.101.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.101.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.101.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.102.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.102.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.102.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.103.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.103.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.103.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.104.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.104.w2.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.104.w3.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.105.w1.weight": "consolidated-00168-of-00272.safetensors", + "layers.44.experts.105.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.105.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.106.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.106.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.106.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.107.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.107.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.107.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.108.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.108.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.108.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.109.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.109.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.109.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.11.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.11.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.11.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.110.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.110.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.110.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.111.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.111.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.111.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.112.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.112.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.112.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.113.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.113.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.113.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.114.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.114.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.114.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.115.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.115.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.115.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.116.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.116.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.116.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.117.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.117.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.117.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.118.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.118.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.118.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.119.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.119.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.119.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.12.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.12.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.12.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.120.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.120.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.120.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.121.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.121.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.121.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.122.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.122.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.122.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.123.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.123.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.123.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.124.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.124.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.124.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.125.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.125.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.125.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.126.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.126.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.126.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.127.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.127.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.127.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.13.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.13.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.13.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.14.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.14.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.14.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.15.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.15.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.15.w3.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.16.w1.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.16.w2.weight": "consolidated-00169-of-00272.safetensors", + "layers.44.experts.16.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.17.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.17.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.17.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.18.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.18.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.18.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.19.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.19.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.19.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.2.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.2.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.2.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.20.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.20.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.20.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.21.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.21.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.21.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.22.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.22.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.22.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.23.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.23.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.23.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.24.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.24.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.24.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.25.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.25.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.25.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.26.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.26.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.26.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.27.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.27.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.27.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.28.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.28.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.28.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.29.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.29.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.29.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.3.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.3.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.3.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.30.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.30.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.30.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.31.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.31.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.31.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.32.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.32.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.32.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.33.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.33.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.33.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.34.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.34.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.34.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.35.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.35.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.35.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.36.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.36.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.36.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.37.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.37.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.37.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.38.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.38.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.38.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.39.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.39.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.39.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.4.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.4.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.4.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.40.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.40.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.40.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.41.w1.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.41.w2.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.41.w3.weight": "consolidated-00170-of-00272.safetensors", + "layers.44.experts.42.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.42.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.42.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.43.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.43.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.43.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.44.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.44.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.44.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.45.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.45.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.45.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.46.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.46.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.46.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.47.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.47.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.47.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.48.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.48.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.48.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.49.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.49.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.49.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.5.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.5.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.5.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.50.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.50.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.50.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.51.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.51.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.51.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.52.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.52.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.52.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.53.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.53.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.53.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.54.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.54.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.54.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.55.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.55.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.55.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.56.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.56.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.56.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.57.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.57.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.57.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.58.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.58.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.58.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.59.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.59.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.59.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.6.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.6.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.6.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.60.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.60.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.60.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.61.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.61.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.61.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.62.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.62.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.62.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.63.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.63.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.63.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.64.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.64.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.64.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.65.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.65.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.65.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.66.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.66.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.66.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.67.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.67.w2.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.67.w3.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.68.w1.weight": "consolidated-00171-of-00272.safetensors", + "layers.44.experts.68.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.68.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.69.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.69.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.69.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.7.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.7.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.7.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.70.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.70.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.70.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.71.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.71.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.71.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.72.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.72.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.72.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.73.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.73.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.73.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.74.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.74.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.74.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.75.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.75.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.75.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.76.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.76.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.76.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.77.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.77.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.77.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.78.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.78.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.78.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.79.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.79.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.79.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.8.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.8.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.8.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.80.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.80.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.80.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.81.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.81.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.81.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.82.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.82.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.82.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.83.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.83.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.83.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.84.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.84.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.84.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.85.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.85.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.85.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.86.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.86.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.86.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.87.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.87.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.87.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.88.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.88.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.88.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.89.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.89.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.89.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.9.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.9.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.9.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.90.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.90.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.90.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.91.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.91.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.91.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.92.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.92.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.92.w3.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.93.w1.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.93.w2.weight": "consolidated-00172-of-00272.safetensors", + "layers.44.experts.93.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.94.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.94.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.94.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.95.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.95.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.95.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.96.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.96.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.96.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.97.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.97.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.97.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.98.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.98.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.98.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.99.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.99.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.experts.99.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.ffn_norm.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.gate.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.shared_experts.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.shared_experts.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.44.shared_experts.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.attention.kv_a_norm.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.attention.q_a_norm.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.attention.wkv_a_with_mqa.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.attention.wkv_b.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.attention.wo.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.attention.wq_a.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.attention.wq_b.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.attention_norm.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.0.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.0.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.0.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.1.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.1.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.1.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.10.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.10.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.10.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.100.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.100.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.100.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.101.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.101.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.101.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.102.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.102.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.102.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.103.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.103.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.103.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.104.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.104.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.104.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.105.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.105.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.105.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.106.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.106.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.106.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.107.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.107.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.107.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.108.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.108.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.108.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.109.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.109.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.109.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.11.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.11.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.11.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.110.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.110.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.110.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.111.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.111.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.111.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.112.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.112.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.112.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.113.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.113.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.113.w3.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.114.w1.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.114.w2.weight": "consolidated-00173-of-00272.safetensors", + "layers.45.experts.114.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.115.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.115.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.115.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.116.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.116.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.116.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.117.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.117.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.117.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.118.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.118.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.118.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.119.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.119.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.119.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.12.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.12.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.12.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.120.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.120.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.120.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.121.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.121.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.121.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.122.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.122.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.122.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.123.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.123.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.123.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.124.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.124.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.124.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.125.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.125.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.125.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.126.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.126.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.126.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.127.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.127.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.127.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.13.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.13.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.13.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.14.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.14.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.14.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.15.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.15.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.15.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.16.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.16.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.16.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.17.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.17.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.17.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.18.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.18.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.18.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.19.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.19.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.19.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.2.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.2.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.2.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.20.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.20.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.20.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.21.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.21.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.21.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.22.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.22.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.22.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.23.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.23.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.23.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.24.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.24.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.24.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.25.w1.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.25.w2.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.25.w3.weight": "consolidated-00174-of-00272.safetensors", + "layers.45.experts.26.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.26.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.26.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.27.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.27.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.27.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.28.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.28.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.28.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.29.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.29.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.29.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.3.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.3.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.3.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.30.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.30.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.30.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.31.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.31.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.31.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.32.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.32.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.32.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.33.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.33.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.33.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.34.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.34.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.34.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.35.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.35.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.35.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.36.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.36.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.36.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.37.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.37.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.37.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.38.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.38.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.38.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.39.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.39.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.39.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.4.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.4.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.4.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.40.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.40.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.40.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.41.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.41.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.41.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.42.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.42.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.42.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.43.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.43.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.43.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.44.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.44.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.44.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.45.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.45.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.45.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.46.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.46.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.46.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.47.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.47.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.47.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.48.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.48.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.48.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.49.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.49.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.49.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.5.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.5.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.5.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.50.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.50.w2.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.50.w3.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.51.w1.weight": "consolidated-00175-of-00272.safetensors", + "layers.45.experts.51.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.51.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.52.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.52.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.52.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.53.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.53.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.53.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.54.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.54.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.54.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.55.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.55.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.55.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.56.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.56.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.56.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.57.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.57.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.57.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.58.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.58.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.58.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.59.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.59.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.59.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.6.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.6.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.6.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.60.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.60.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.60.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.61.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.61.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.61.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.62.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.62.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.62.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.63.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.63.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.63.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.64.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.64.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.64.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.65.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.65.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.65.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.66.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.66.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.66.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.67.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.67.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.67.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.68.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.68.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.68.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.69.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.69.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.69.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.7.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.7.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.7.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.70.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.70.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.70.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.71.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.71.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.71.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.72.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.72.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.72.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.73.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.73.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.73.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.74.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.74.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.74.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.75.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.75.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.75.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.76.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.76.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.76.w3.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.77.w1.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.77.w2.weight": "consolidated-00176-of-00272.safetensors", + "layers.45.experts.77.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.78.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.78.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.78.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.79.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.79.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.79.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.8.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.8.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.8.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.80.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.80.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.80.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.81.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.81.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.81.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.82.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.82.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.82.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.83.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.83.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.83.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.84.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.84.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.84.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.85.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.85.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.85.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.86.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.86.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.86.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.87.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.87.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.87.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.88.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.88.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.88.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.89.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.89.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.89.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.9.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.9.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.9.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.90.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.90.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.90.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.91.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.91.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.91.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.92.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.92.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.92.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.93.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.93.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.93.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.94.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.94.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.94.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.95.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.95.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.95.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.96.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.96.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.96.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.97.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.97.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.97.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.98.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.98.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.98.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.99.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.99.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.experts.99.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.ffn_norm.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.gate.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.shared_experts.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.shared_experts.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.45.shared_experts.w3.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.attention.kv_a_norm.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.attention.q_a_norm.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.attention.wkv_a_with_mqa.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.attention.wkv_b.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.attention.wo.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.attention.wq_a.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.attention.wq_b.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.attention_norm.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.experts.0.w1.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.experts.0.w2.weight": "consolidated-00177-of-00272.safetensors", + "layers.46.experts.0.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.1.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.1.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.1.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.10.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.10.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.10.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.100.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.100.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.100.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.101.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.101.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.101.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.102.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.102.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.102.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.103.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.103.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.103.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.104.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.104.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.104.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.105.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.105.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.105.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.106.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.106.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.106.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.107.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.107.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.107.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.108.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.108.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.108.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.109.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.109.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.109.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.11.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.11.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.11.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.110.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.110.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.110.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.111.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.111.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.111.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.112.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.112.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.112.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.113.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.113.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.113.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.114.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.114.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.114.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.115.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.115.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.115.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.116.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.116.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.116.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.117.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.117.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.117.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.118.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.118.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.118.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.119.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.119.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.119.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.12.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.12.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.12.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.120.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.120.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.120.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.121.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.121.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.121.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.122.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.122.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.122.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.123.w1.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.123.w2.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.123.w3.weight": "consolidated-00178-of-00272.safetensors", + "layers.46.experts.124.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.124.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.124.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.125.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.125.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.125.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.126.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.126.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.126.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.127.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.127.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.127.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.13.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.13.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.13.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.14.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.14.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.14.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.15.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.15.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.15.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.16.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.16.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.16.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.17.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.17.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.17.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.18.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.18.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.18.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.19.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.19.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.19.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.2.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.2.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.2.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.20.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.20.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.20.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.21.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.21.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.21.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.22.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.22.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.22.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.23.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.23.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.23.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.24.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.24.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.24.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.25.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.25.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.25.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.26.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.26.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.26.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.27.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.27.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.27.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.28.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.28.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.28.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.29.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.29.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.29.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.3.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.3.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.3.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.30.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.30.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.30.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.31.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.31.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.31.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.32.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.32.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.32.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.33.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.33.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.33.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.34.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.34.w2.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.34.w3.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.35.w1.weight": "consolidated-00179-of-00272.safetensors", + "layers.46.experts.35.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.35.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.36.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.36.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.36.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.37.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.37.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.37.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.38.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.38.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.38.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.39.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.39.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.39.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.4.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.4.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.4.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.40.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.40.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.40.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.41.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.41.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.41.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.42.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.42.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.42.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.43.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.43.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.43.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.44.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.44.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.44.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.45.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.45.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.45.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.46.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.46.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.46.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.47.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.47.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.47.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.48.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.48.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.48.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.49.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.49.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.49.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.5.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.5.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.5.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.50.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.50.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.50.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.51.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.51.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.51.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.52.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.52.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.52.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.53.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.53.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.53.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.54.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.54.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.54.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.55.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.55.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.55.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.56.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.56.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.56.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.57.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.57.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.57.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.58.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.58.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.58.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.59.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.59.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.59.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.6.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.6.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.6.w3.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.60.w1.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.60.w2.weight": "consolidated-00180-of-00272.safetensors", + "layers.46.experts.60.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.61.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.61.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.61.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.62.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.62.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.62.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.63.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.63.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.63.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.64.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.64.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.64.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.65.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.65.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.65.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.66.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.66.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.66.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.67.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.67.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.67.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.68.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.68.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.68.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.69.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.69.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.69.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.7.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.7.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.7.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.70.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.70.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.70.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.71.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.71.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.71.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.72.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.72.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.72.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.73.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.73.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.73.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.74.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.74.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.74.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.75.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.75.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.75.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.76.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.76.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.76.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.77.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.77.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.77.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.78.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.78.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.78.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.79.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.79.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.79.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.8.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.8.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.8.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.80.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.80.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.80.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.81.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.81.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.81.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.82.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.82.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.82.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.83.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.83.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.83.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.84.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.84.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.84.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.85.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.85.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.85.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.86.w1.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.86.w2.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.86.w3.weight": "consolidated-00181-of-00272.safetensors", + "layers.46.experts.87.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.87.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.87.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.88.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.88.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.88.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.89.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.89.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.89.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.9.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.9.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.9.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.90.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.90.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.90.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.91.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.91.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.91.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.92.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.92.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.92.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.93.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.93.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.93.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.94.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.94.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.94.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.95.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.95.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.95.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.96.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.96.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.96.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.97.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.97.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.97.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.98.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.98.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.98.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.99.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.99.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.experts.99.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.ffn_norm.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.gate.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.shared_experts.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.shared_experts.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.46.shared_experts.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.attention.kv_a_norm.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.attention.q_a_norm.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.attention.wkv_a_with_mqa.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.attention.wkv_b.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.attention.wo.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.attention.wq_a.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.attention.wq_b.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.attention_norm.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.0.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.0.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.0.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.1.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.1.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.1.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.10.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.10.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.10.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.100.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.100.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.100.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.101.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.101.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.101.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.102.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.102.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.102.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.103.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.103.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.103.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.104.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.104.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.104.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.105.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.105.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.105.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.106.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.106.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.106.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.107.w1.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.107.w2.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.107.w3.weight": "consolidated-00182-of-00272.safetensors", + "layers.47.experts.108.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.108.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.108.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.109.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.109.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.109.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.11.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.11.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.11.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.110.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.110.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.110.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.111.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.111.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.111.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.112.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.112.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.112.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.113.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.113.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.113.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.114.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.114.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.114.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.115.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.115.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.115.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.116.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.116.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.116.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.117.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.117.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.117.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.118.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.118.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.118.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.119.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.119.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.119.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.12.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.12.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.12.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.120.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.120.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.120.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.121.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.121.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.121.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.122.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.122.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.122.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.123.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.123.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.123.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.124.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.124.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.124.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.125.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.125.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.125.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.126.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.126.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.126.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.127.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.127.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.127.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.13.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.13.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.13.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.14.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.14.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.14.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.15.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.15.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.15.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.16.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.16.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.16.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.17.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.17.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.17.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.18.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.18.w2.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.18.w3.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.19.w1.weight": "consolidated-00183-of-00272.safetensors", + "layers.47.experts.19.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.19.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.2.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.2.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.2.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.20.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.20.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.20.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.21.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.21.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.21.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.22.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.22.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.22.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.23.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.23.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.23.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.24.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.24.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.24.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.25.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.25.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.25.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.26.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.26.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.26.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.27.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.27.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.27.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.28.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.28.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.28.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.29.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.29.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.29.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.3.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.3.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.3.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.30.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.30.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.30.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.31.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.31.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.31.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.32.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.32.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.32.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.33.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.33.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.33.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.34.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.34.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.34.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.35.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.35.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.35.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.36.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.36.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.36.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.37.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.37.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.37.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.38.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.38.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.38.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.39.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.39.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.39.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.4.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.4.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.4.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.40.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.40.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.40.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.41.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.41.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.41.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.42.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.42.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.42.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.43.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.43.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.43.w3.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.44.w1.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.44.w2.weight": "consolidated-00184-of-00272.safetensors", + "layers.47.experts.44.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.45.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.45.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.45.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.46.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.46.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.46.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.47.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.47.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.47.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.48.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.48.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.48.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.49.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.49.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.49.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.5.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.5.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.5.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.50.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.50.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.50.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.51.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.51.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.51.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.52.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.52.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.52.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.53.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.53.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.53.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.54.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.54.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.54.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.55.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.55.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.55.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.56.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.56.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.56.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.57.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.57.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.57.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.58.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.58.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.58.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.59.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.59.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.59.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.6.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.6.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.6.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.60.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.60.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.60.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.61.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.61.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.61.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.62.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.62.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.62.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.63.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.63.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.63.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.64.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.64.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.64.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.65.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.65.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.65.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.66.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.66.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.66.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.67.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.67.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.67.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.68.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.68.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.68.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.69.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.69.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.69.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.7.w1.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.7.w2.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.7.w3.weight": "consolidated-00185-of-00272.safetensors", + "layers.47.experts.70.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.70.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.70.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.71.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.71.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.71.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.72.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.72.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.72.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.73.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.73.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.73.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.74.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.74.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.74.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.75.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.75.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.75.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.76.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.76.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.76.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.77.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.77.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.77.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.78.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.78.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.78.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.79.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.79.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.79.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.8.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.8.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.8.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.80.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.80.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.80.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.81.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.81.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.81.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.82.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.82.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.82.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.83.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.83.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.83.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.84.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.84.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.84.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.85.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.85.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.85.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.86.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.86.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.86.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.87.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.87.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.87.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.88.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.88.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.88.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.89.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.89.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.89.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.9.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.9.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.9.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.90.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.90.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.90.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.91.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.91.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.91.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.92.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.92.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.92.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.93.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.93.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.93.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.94.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.94.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.94.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.95.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.95.w2.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.95.w3.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.96.w1.weight": "consolidated-00186-of-00272.safetensors", + "layers.47.experts.96.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.96.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.97.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.97.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.97.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.98.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.98.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.98.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.99.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.99.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.experts.99.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.ffn_norm.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.gate.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.shared_experts.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.shared_experts.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.47.shared_experts.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.attention.kv_a_norm.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.attention.q_a_norm.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.attention.wkv_a_with_mqa.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.attention.wkv_b.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.attention.wo.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.attention.wq_a.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.attention.wq_b.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.attention_norm.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.0.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.0.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.0.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.1.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.1.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.1.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.10.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.10.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.10.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.100.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.100.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.100.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.101.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.101.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.101.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.102.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.102.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.102.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.103.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.103.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.103.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.104.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.104.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.104.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.105.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.105.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.105.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.106.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.106.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.106.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.107.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.107.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.107.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.108.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.108.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.108.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.109.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.109.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.109.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.11.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.11.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.11.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.110.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.110.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.110.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.111.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.111.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.111.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.112.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.112.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.112.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.113.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.113.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.113.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.114.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.114.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.114.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.115.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.115.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.115.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.116.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.116.w2.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.116.w3.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.117.w1.weight": "consolidated-00187-of-00272.safetensors", + "layers.48.experts.117.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.117.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.118.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.118.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.118.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.119.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.119.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.119.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.12.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.12.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.12.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.120.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.120.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.120.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.121.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.121.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.121.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.122.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.122.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.122.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.123.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.123.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.123.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.124.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.124.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.124.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.125.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.125.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.125.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.126.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.126.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.126.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.127.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.127.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.127.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.13.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.13.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.13.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.14.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.14.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.14.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.15.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.15.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.15.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.16.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.16.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.16.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.17.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.17.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.17.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.18.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.18.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.18.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.19.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.19.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.19.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.2.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.2.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.2.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.20.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.20.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.20.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.21.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.21.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.21.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.22.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.22.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.22.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.23.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.23.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.23.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.24.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.24.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.24.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.25.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.25.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.25.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.26.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.26.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.26.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.27.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.27.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.27.w3.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.28.w1.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.28.w2.weight": "consolidated-00188-of-00272.safetensors", + "layers.48.experts.28.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.29.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.29.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.29.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.3.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.3.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.3.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.30.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.30.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.30.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.31.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.31.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.31.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.32.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.32.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.32.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.33.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.33.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.33.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.34.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.34.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.34.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.35.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.35.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.35.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.36.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.36.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.36.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.37.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.37.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.37.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.38.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.38.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.38.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.39.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.39.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.39.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.4.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.4.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.4.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.40.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.40.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.40.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.41.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.41.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.41.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.42.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.42.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.42.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.43.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.43.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.43.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.44.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.44.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.44.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.45.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.45.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.45.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.46.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.46.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.46.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.47.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.47.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.47.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.48.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.48.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.48.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.49.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.49.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.49.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.5.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.5.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.5.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.50.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.50.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.50.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.51.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.51.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.51.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.52.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.52.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.52.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.53.w1.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.53.w2.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.53.w3.weight": "consolidated-00189-of-00272.safetensors", + "layers.48.experts.54.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.54.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.54.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.55.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.55.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.55.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.56.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.56.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.56.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.57.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.57.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.57.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.58.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.58.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.58.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.59.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.59.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.59.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.6.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.6.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.6.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.60.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.60.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.60.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.61.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.61.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.61.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.62.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.62.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.62.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.63.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.63.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.63.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.64.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.64.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.64.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.65.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.65.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.65.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.66.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.66.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.66.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.67.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.67.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.67.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.68.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.68.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.68.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.69.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.69.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.69.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.7.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.7.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.7.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.70.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.70.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.70.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.71.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.71.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.71.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.72.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.72.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.72.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.73.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.73.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.73.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.74.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.74.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.74.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.75.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.75.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.75.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.76.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.76.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.76.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.77.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.77.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.77.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.78.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.78.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.78.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.79.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.79.w2.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.79.w3.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.8.w1.weight": "consolidated-00190-of-00272.safetensors", + "layers.48.experts.8.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.8.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.80.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.80.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.80.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.81.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.81.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.81.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.82.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.82.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.82.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.83.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.83.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.83.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.84.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.84.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.84.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.85.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.85.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.85.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.86.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.86.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.86.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.87.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.87.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.87.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.88.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.88.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.88.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.89.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.89.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.89.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.9.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.9.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.9.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.90.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.90.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.90.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.91.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.91.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.91.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.92.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.92.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.92.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.93.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.93.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.93.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.94.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.94.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.94.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.95.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.95.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.95.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.96.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.96.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.96.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.97.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.97.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.97.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.98.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.98.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.98.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.99.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.99.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.experts.99.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.ffn_norm.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.gate.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.shared_experts.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.shared_experts.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.48.shared_experts.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.attention.kv_a_norm.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.attention.q_a_norm.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.attention.wkv_a_with_mqa.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.attention.wkv_b.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.attention.wo.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.attention.wq_a.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.attention.wq_b.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.attention_norm.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.0.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.0.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.0.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.1.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.1.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.1.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.10.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.10.w2.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.10.w3.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.100.w1.weight": "consolidated-00191-of-00272.safetensors", + "layers.49.experts.100.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.100.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.101.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.101.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.101.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.102.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.102.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.102.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.103.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.103.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.103.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.104.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.104.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.104.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.105.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.105.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.105.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.106.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.106.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.106.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.107.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.107.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.107.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.108.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.108.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.108.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.109.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.109.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.109.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.11.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.11.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.11.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.110.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.110.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.110.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.111.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.111.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.111.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.112.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.112.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.112.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.113.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.113.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.113.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.114.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.114.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.114.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.115.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.115.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.115.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.116.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.116.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.116.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.117.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.117.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.117.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.118.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.118.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.118.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.119.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.119.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.119.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.12.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.12.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.12.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.120.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.120.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.120.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.121.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.121.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.121.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.122.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.122.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.122.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.123.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.123.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.123.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.124.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.124.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.124.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.125.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.125.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.125.w3.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.126.w1.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.126.w2.weight": "consolidated-00192-of-00272.safetensors", + "layers.49.experts.126.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.127.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.127.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.127.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.13.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.13.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.13.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.14.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.14.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.14.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.15.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.15.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.15.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.16.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.16.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.16.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.17.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.17.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.17.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.18.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.18.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.18.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.19.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.19.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.19.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.2.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.2.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.2.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.20.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.20.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.20.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.21.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.21.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.21.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.22.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.22.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.22.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.23.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.23.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.23.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.24.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.24.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.24.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.25.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.25.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.25.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.26.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.26.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.26.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.27.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.27.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.27.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.28.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.28.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.28.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.29.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.29.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.29.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.3.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.3.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.3.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.30.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.30.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.30.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.31.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.31.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.31.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.32.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.32.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.32.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.33.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.33.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.33.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.34.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.34.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.34.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.35.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.35.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.35.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.36.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.36.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.36.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.37.w1.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.37.w2.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.37.w3.weight": "consolidated-00193-of-00272.safetensors", + "layers.49.experts.38.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.38.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.38.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.39.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.39.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.39.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.4.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.4.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.4.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.40.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.40.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.40.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.41.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.41.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.41.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.42.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.42.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.42.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.43.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.43.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.43.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.44.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.44.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.44.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.45.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.45.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.45.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.46.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.46.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.46.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.47.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.47.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.47.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.48.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.48.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.48.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.49.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.49.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.49.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.5.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.5.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.5.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.50.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.50.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.50.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.51.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.51.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.51.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.52.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.52.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.52.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.53.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.53.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.53.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.54.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.54.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.54.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.55.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.55.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.55.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.56.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.56.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.56.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.57.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.57.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.57.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.58.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.58.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.58.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.59.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.59.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.59.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.6.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.6.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.6.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.60.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.60.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.60.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.61.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.61.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.61.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.62.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.62.w2.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.62.w3.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.63.w1.weight": "consolidated-00194-of-00272.safetensors", + "layers.49.experts.63.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.63.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.64.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.64.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.64.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.65.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.65.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.65.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.66.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.66.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.66.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.67.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.67.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.67.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.68.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.68.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.68.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.69.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.69.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.69.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.7.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.7.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.7.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.70.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.70.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.70.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.71.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.71.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.71.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.72.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.72.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.72.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.73.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.73.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.73.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.74.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.74.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.74.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.75.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.75.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.75.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.76.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.76.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.76.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.77.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.77.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.77.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.78.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.78.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.78.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.79.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.79.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.79.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.8.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.8.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.8.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.80.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.80.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.80.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.81.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.81.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.81.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.82.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.82.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.82.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.83.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.83.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.83.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.84.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.84.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.84.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.85.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.85.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.85.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.86.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.86.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.86.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.87.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.87.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.87.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.88.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.88.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.88.w3.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.89.w1.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.89.w2.weight": "consolidated-00195-of-00272.safetensors", + "layers.49.experts.89.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.9.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.9.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.9.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.90.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.90.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.90.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.91.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.91.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.91.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.92.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.92.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.92.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.93.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.93.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.93.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.94.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.94.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.94.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.95.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.95.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.95.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.96.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.96.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.96.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.97.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.97.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.97.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.98.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.98.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.98.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.99.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.99.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.experts.99.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.ffn_norm.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.gate.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.shared_experts.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.shared_experts.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.49.shared_experts.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.attention.kv_a_norm.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.attention.q_a_norm.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.attention.wkv_a_with_mqa.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.attention.wkv_b.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.attention.wo.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.attention.wq_a.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.attention.wq_b.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.attention_norm.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.0.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.0.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.0.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.1.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.1.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.1.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.10.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.10.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.10.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.100.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.100.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.100.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.101.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.101.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.101.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.102.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.102.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.102.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.103.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.103.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.103.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.104.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.104.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.104.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.105.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.105.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.105.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.106.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.106.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.106.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.107.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.107.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.107.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.108.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.108.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.108.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.109.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.109.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.109.w3.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.11.w1.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.11.w2.weight": "consolidated-00196-of-00272.safetensors", + "layers.5.experts.11.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.110.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.110.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.110.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.111.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.111.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.111.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.112.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.112.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.112.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.113.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.113.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.113.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.114.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.114.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.114.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.115.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.115.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.115.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.116.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.116.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.116.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.117.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.117.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.117.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.118.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.118.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.118.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.119.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.119.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.119.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.12.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.12.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.12.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.120.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.120.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.120.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.121.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.121.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.121.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.122.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.122.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.122.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.123.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.123.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.123.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.124.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.124.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.124.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.125.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.125.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.125.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.126.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.126.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.126.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.127.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.127.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.127.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.13.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.13.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.13.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.14.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.14.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.14.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.15.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.15.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.15.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.16.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.16.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.16.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.17.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.17.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.17.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.18.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.18.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.18.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.19.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.19.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.19.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.2.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.2.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.2.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.20.w1.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.20.w2.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.20.w3.weight": "consolidated-00197-of-00272.safetensors", + "layers.5.experts.21.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.21.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.21.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.22.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.22.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.22.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.23.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.23.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.23.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.24.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.24.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.24.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.25.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.25.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.25.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.26.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.26.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.26.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.27.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.27.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.27.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.28.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.28.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.28.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.29.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.29.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.29.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.3.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.3.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.3.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.30.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.30.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.30.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.31.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.31.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.31.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.32.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.32.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.32.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.33.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.33.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.33.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.34.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.34.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.34.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.35.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.35.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.35.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.36.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.36.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.36.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.37.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.37.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.37.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.38.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.38.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.38.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.39.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.39.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.39.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.4.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.4.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.4.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.40.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.40.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.40.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.41.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.41.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.41.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.42.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.42.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.42.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.43.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.43.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.43.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.44.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.44.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.44.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.45.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.45.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.45.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.46.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.46.w2.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.46.w3.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.47.w1.weight": "consolidated-00198-of-00272.safetensors", + "layers.5.experts.47.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.47.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.48.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.48.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.48.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.49.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.49.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.49.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.5.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.5.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.5.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.50.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.50.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.50.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.51.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.51.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.51.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.52.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.52.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.52.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.53.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.53.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.53.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.54.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.54.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.54.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.55.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.55.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.55.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.56.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.56.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.56.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.57.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.57.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.57.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.58.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.58.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.58.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.59.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.59.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.59.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.6.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.6.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.6.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.60.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.60.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.60.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.61.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.61.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.61.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.62.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.62.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.62.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.63.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.63.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.63.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.64.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.64.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.64.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.65.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.65.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.65.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.66.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.66.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.66.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.67.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.67.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.67.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.68.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.68.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.68.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.69.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.69.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.69.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.7.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.7.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.7.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.70.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.70.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.70.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.71.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.71.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.71.w3.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.72.w1.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.72.w2.weight": "consolidated-00199-of-00272.safetensors", + "layers.5.experts.72.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.73.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.73.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.73.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.74.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.74.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.74.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.75.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.75.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.75.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.76.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.76.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.76.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.77.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.77.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.77.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.78.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.78.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.78.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.79.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.79.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.79.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.8.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.8.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.8.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.80.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.80.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.80.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.81.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.81.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.81.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.82.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.82.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.82.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.83.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.83.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.83.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.84.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.84.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.84.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.85.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.85.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.85.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.86.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.86.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.86.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.87.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.87.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.87.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.88.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.88.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.88.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.89.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.89.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.89.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.9.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.9.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.9.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.90.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.90.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.90.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.91.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.91.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.91.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.92.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.92.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.92.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.93.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.93.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.93.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.94.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.94.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.94.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.95.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.95.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.95.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.96.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.96.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.96.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.97.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.97.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.97.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.98.w1.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.98.w2.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.98.w3.weight": "consolidated-00200-of-00272.safetensors", + "layers.5.experts.99.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.5.experts.99.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.5.experts.99.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.5.ffn_norm.weight": "consolidated-00201-of-00272.safetensors", + "layers.5.gate.weight": "consolidated-00201-of-00272.safetensors", + "layers.5.shared_experts.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.5.shared_experts.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.5.shared_experts.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.attention.kv_a_norm.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.attention.q_a_norm.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.attention.wkv_a_with_mqa.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.attention.wkv_b.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.attention.wo.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.attention.wq_a.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.attention.wq_b.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.attention_norm.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.0.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.0.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.0.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.1.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.1.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.1.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.10.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.10.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.10.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.100.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.100.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.100.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.101.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.101.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.101.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.102.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.102.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.102.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.103.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.103.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.103.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.104.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.104.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.104.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.105.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.105.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.105.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.106.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.106.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.106.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.107.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.107.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.107.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.108.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.108.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.108.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.109.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.109.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.109.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.11.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.11.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.11.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.110.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.110.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.110.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.111.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.111.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.111.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.112.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.112.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.112.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.113.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.113.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.113.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.114.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.114.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.114.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.115.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.115.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.115.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.116.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.116.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.116.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.117.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.117.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.117.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.118.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.118.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.118.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.119.w1.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.119.w2.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.119.w3.weight": "consolidated-00201-of-00272.safetensors", + "layers.50.experts.12.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.12.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.12.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.120.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.120.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.120.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.121.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.121.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.121.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.122.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.122.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.122.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.123.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.123.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.123.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.124.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.124.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.124.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.125.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.125.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.125.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.126.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.126.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.126.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.127.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.127.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.127.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.13.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.13.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.13.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.14.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.14.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.14.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.15.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.15.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.15.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.16.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.16.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.16.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.17.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.17.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.17.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.18.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.18.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.18.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.19.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.19.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.19.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.2.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.2.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.2.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.20.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.20.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.20.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.21.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.21.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.21.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.22.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.22.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.22.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.23.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.23.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.23.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.24.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.24.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.24.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.25.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.25.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.25.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.26.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.26.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.26.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.27.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.27.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.27.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.28.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.28.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.28.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.29.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.29.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.29.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.3.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.3.w2.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.3.w3.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.30.w1.weight": "consolidated-00202-of-00272.safetensors", + "layers.50.experts.30.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.30.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.31.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.31.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.31.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.32.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.32.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.32.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.33.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.33.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.33.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.34.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.34.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.34.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.35.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.35.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.35.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.36.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.36.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.36.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.37.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.37.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.37.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.38.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.38.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.38.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.39.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.39.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.39.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.4.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.4.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.4.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.40.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.40.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.40.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.41.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.41.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.41.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.42.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.42.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.42.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.43.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.43.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.43.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.44.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.44.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.44.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.45.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.45.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.45.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.46.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.46.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.46.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.47.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.47.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.47.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.48.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.48.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.48.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.49.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.49.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.49.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.5.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.5.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.5.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.50.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.50.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.50.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.51.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.51.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.51.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.52.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.52.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.52.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.53.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.53.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.53.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.54.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.54.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.54.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.55.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.55.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.55.w3.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.56.w1.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.56.w2.weight": "consolidated-00203-of-00272.safetensors", + "layers.50.experts.56.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.57.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.57.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.57.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.58.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.58.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.58.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.59.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.59.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.59.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.6.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.6.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.6.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.60.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.60.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.60.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.61.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.61.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.61.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.62.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.62.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.62.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.63.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.63.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.63.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.64.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.64.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.64.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.65.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.65.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.65.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.66.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.66.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.66.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.67.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.67.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.67.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.68.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.68.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.68.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.69.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.69.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.69.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.7.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.7.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.7.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.70.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.70.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.70.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.71.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.71.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.71.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.72.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.72.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.72.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.73.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.73.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.73.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.74.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.74.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.74.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.75.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.75.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.75.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.76.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.76.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.76.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.77.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.77.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.77.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.78.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.78.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.78.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.79.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.79.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.79.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.8.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.8.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.8.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.80.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.80.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.80.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.81.w1.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.81.w2.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.81.w3.weight": "consolidated-00204-of-00272.safetensors", + "layers.50.experts.82.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.82.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.82.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.83.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.83.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.83.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.84.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.84.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.84.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.85.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.85.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.85.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.86.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.86.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.86.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.87.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.87.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.87.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.88.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.88.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.88.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.89.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.89.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.89.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.9.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.9.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.9.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.90.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.90.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.90.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.91.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.91.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.91.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.92.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.92.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.92.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.93.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.93.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.93.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.94.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.94.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.94.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.95.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.95.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.95.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.96.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.96.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.96.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.97.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.97.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.97.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.98.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.98.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.98.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.99.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.99.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.experts.99.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.ffn_norm.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.gate.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.shared_experts.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.shared_experts.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.50.shared_experts.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.attention.kv_a_norm.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.attention.q_a_norm.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.attention.wkv_a_with_mqa.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.attention.wkv_b.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.attention.wo.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.attention.wq_a.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.attention.wq_b.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.attention_norm.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.0.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.0.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.0.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.1.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.1.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.1.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.10.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.10.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.10.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.100.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.100.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.100.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.101.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.101.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.101.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.102.w1.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.102.w2.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.102.w3.weight": "consolidated-00205-of-00272.safetensors", + "layers.51.experts.103.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.103.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.103.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.104.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.104.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.104.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.105.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.105.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.105.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.106.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.106.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.106.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.107.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.107.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.107.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.108.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.108.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.108.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.109.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.109.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.109.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.11.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.11.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.11.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.110.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.110.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.110.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.111.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.111.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.111.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.112.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.112.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.112.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.113.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.113.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.113.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.114.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.114.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.114.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.115.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.115.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.115.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.116.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.116.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.116.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.117.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.117.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.117.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.118.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.118.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.118.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.119.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.119.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.119.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.12.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.12.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.12.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.120.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.120.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.120.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.121.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.121.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.121.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.122.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.122.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.122.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.123.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.123.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.123.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.124.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.124.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.124.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.125.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.125.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.125.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.126.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.126.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.126.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.127.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.127.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.127.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.13.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.13.w2.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.13.w3.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.14.w1.weight": "consolidated-00206-of-00272.safetensors", + "layers.51.experts.14.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.14.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.15.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.15.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.15.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.16.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.16.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.16.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.17.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.17.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.17.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.18.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.18.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.18.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.19.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.19.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.19.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.2.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.2.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.2.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.20.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.20.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.20.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.21.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.21.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.21.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.22.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.22.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.22.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.23.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.23.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.23.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.24.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.24.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.24.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.25.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.25.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.25.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.26.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.26.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.26.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.27.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.27.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.27.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.28.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.28.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.28.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.29.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.29.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.29.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.3.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.3.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.3.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.30.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.30.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.30.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.31.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.31.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.31.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.32.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.32.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.32.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.33.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.33.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.33.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.34.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.34.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.34.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.35.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.35.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.35.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.36.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.36.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.36.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.37.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.37.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.37.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.38.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.38.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.38.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.39.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.39.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.39.w3.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.4.w1.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.4.w2.weight": "consolidated-00207-of-00272.safetensors", + "layers.51.experts.4.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.40.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.40.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.40.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.41.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.41.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.41.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.42.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.42.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.42.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.43.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.43.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.43.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.44.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.44.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.44.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.45.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.45.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.45.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.46.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.46.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.46.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.47.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.47.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.47.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.48.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.48.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.48.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.49.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.49.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.49.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.5.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.5.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.5.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.50.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.50.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.50.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.51.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.51.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.51.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.52.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.52.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.52.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.53.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.53.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.53.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.54.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.54.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.54.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.55.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.55.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.55.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.56.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.56.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.56.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.57.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.57.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.57.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.58.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.58.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.58.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.59.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.59.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.59.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.6.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.6.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.6.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.60.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.60.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.60.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.61.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.61.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.61.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.62.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.62.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.62.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.63.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.63.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.63.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.64.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.64.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.64.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.65.w1.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.65.w2.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.65.w3.weight": "consolidated-00208-of-00272.safetensors", + "layers.51.experts.66.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.66.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.66.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.67.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.67.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.67.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.68.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.68.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.68.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.69.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.69.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.69.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.7.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.7.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.7.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.70.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.70.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.70.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.71.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.71.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.71.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.72.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.72.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.72.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.73.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.73.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.73.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.74.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.74.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.74.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.75.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.75.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.75.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.76.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.76.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.76.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.77.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.77.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.77.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.78.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.78.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.78.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.79.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.79.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.79.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.8.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.8.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.8.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.80.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.80.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.80.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.81.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.81.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.81.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.82.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.82.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.82.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.83.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.83.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.83.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.84.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.84.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.84.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.85.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.85.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.85.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.86.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.86.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.86.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.87.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.87.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.87.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.88.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.88.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.88.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.89.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.89.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.89.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.9.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.9.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.9.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.90.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.90.w2.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.90.w3.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.91.w1.weight": "consolidated-00209-of-00272.safetensors", + "layers.51.experts.91.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.91.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.92.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.92.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.92.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.93.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.93.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.93.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.94.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.94.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.94.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.95.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.95.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.95.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.96.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.96.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.96.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.97.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.97.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.97.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.98.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.98.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.98.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.99.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.99.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.experts.99.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.ffn_norm.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.gate.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.shared_experts.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.shared_experts.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.51.shared_experts.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.attention.kv_a_norm.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.attention.q_a_norm.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.attention.wkv_a_with_mqa.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.attention.wkv_b.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.attention.wo.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.attention.wq_a.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.attention.wq_b.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.attention_norm.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.0.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.0.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.0.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.1.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.1.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.1.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.10.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.10.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.10.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.100.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.100.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.100.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.101.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.101.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.101.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.102.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.102.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.102.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.103.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.103.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.103.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.104.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.104.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.104.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.105.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.105.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.105.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.106.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.106.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.106.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.107.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.107.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.107.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.108.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.108.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.108.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.109.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.109.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.109.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.11.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.11.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.11.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.110.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.110.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.110.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.111.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.111.w2.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.111.w3.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.112.w1.weight": "consolidated-00210-of-00272.safetensors", + "layers.52.experts.112.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.112.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.113.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.113.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.113.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.114.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.114.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.114.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.115.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.115.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.115.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.116.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.116.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.116.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.117.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.117.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.117.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.118.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.118.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.118.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.119.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.119.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.119.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.12.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.12.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.12.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.120.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.120.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.120.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.121.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.121.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.121.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.122.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.122.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.122.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.123.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.123.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.123.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.124.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.124.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.124.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.125.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.125.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.125.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.126.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.126.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.126.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.127.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.127.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.127.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.13.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.13.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.13.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.14.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.14.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.14.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.15.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.15.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.15.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.16.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.16.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.16.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.17.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.17.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.17.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.18.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.18.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.18.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.19.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.19.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.19.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.2.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.2.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.2.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.20.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.20.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.20.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.21.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.21.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.21.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.22.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.22.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.22.w3.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.23.w1.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.23.w2.weight": "consolidated-00211-of-00272.safetensors", + "layers.52.experts.23.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.24.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.24.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.24.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.25.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.25.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.25.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.26.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.26.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.26.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.27.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.27.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.27.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.28.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.28.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.28.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.29.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.29.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.29.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.3.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.3.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.3.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.30.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.30.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.30.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.31.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.31.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.31.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.32.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.32.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.32.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.33.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.33.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.33.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.34.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.34.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.34.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.35.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.35.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.35.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.36.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.36.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.36.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.37.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.37.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.37.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.38.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.38.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.38.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.39.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.39.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.39.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.4.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.4.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.4.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.40.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.40.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.40.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.41.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.41.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.41.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.42.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.42.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.42.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.43.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.43.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.43.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.44.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.44.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.44.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.45.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.45.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.45.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.46.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.46.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.46.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.47.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.47.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.47.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.48.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.48.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.48.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.49.w1.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.49.w2.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.49.w3.weight": "consolidated-00212-of-00272.safetensors", + "layers.52.experts.5.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.5.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.5.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.50.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.50.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.50.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.51.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.51.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.51.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.52.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.52.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.52.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.53.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.53.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.53.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.54.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.54.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.54.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.55.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.55.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.55.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.56.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.56.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.56.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.57.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.57.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.57.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.58.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.58.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.58.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.59.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.59.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.59.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.6.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.6.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.6.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.60.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.60.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.60.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.61.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.61.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.61.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.62.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.62.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.62.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.63.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.63.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.63.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.64.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.64.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.64.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.65.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.65.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.65.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.66.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.66.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.66.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.67.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.67.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.67.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.68.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.68.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.68.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.69.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.69.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.69.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.7.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.7.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.7.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.70.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.70.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.70.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.71.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.71.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.71.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.72.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.72.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.72.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.73.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.73.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.73.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.74.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.74.w2.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.74.w3.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.75.w1.weight": "consolidated-00213-of-00272.safetensors", + "layers.52.experts.75.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.75.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.76.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.76.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.76.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.77.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.77.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.77.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.78.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.78.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.78.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.79.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.79.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.79.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.8.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.8.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.8.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.80.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.80.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.80.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.81.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.81.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.81.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.82.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.82.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.82.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.83.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.83.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.83.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.84.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.84.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.84.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.85.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.85.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.85.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.86.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.86.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.86.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.87.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.87.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.87.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.88.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.88.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.88.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.89.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.89.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.89.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.9.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.9.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.9.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.90.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.90.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.90.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.91.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.91.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.91.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.92.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.92.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.92.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.93.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.93.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.93.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.94.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.94.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.94.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.95.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.95.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.95.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.96.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.96.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.96.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.97.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.97.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.97.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.98.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.98.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.98.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.99.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.99.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.experts.99.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.ffn_norm.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.gate.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.shared_experts.w1.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.shared_experts.w2.weight": "consolidated-00214-of-00272.safetensors", + "layers.52.shared_experts.w3.weight": "consolidated-00214-of-00272.safetensors", + "layers.53.attention.kv_a_norm.weight": "consolidated-00214-of-00272.safetensors", + "layers.53.attention.q_a_norm.weight": "consolidated-00214-of-00272.safetensors", + "layers.53.attention.wkv_a_with_mqa.weight": "consolidated-00214-of-00272.safetensors", + "layers.53.attention.wkv_b.weight": "consolidated-00214-of-00272.safetensors", + "layers.53.attention.wo.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.attention.wq_a.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.attention.wq_b.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.attention_norm.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.0.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.0.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.0.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.1.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.1.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.1.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.10.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.10.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.10.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.100.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.100.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.100.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.101.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.101.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.101.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.102.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.102.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.102.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.103.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.103.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.103.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.104.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.104.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.104.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.105.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.105.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.105.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.106.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.106.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.106.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.107.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.107.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.107.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.108.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.108.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.108.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.109.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.109.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.109.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.11.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.11.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.11.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.110.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.110.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.110.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.111.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.111.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.111.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.112.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.112.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.112.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.113.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.113.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.113.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.114.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.114.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.114.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.115.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.115.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.115.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.116.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.116.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.116.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.117.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.117.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.117.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.118.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.118.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.118.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.119.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.119.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.119.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.12.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.12.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.12.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.120.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.120.w2.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.120.w3.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.121.w1.weight": "consolidated-00215-of-00272.safetensors", + "layers.53.experts.121.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.121.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.122.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.122.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.122.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.123.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.123.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.123.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.124.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.124.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.124.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.125.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.125.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.125.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.126.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.126.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.126.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.127.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.127.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.127.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.13.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.13.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.13.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.14.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.14.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.14.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.15.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.15.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.15.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.16.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.16.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.16.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.17.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.17.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.17.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.18.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.18.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.18.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.19.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.19.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.19.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.2.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.2.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.2.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.20.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.20.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.20.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.21.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.21.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.21.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.22.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.22.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.22.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.23.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.23.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.23.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.24.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.24.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.24.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.25.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.25.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.25.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.26.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.26.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.26.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.27.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.27.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.27.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.28.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.28.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.28.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.29.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.29.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.29.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.3.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.3.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.3.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.30.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.30.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.30.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.31.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.31.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.31.w3.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.32.w1.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.32.w2.weight": "consolidated-00216-of-00272.safetensors", + "layers.53.experts.32.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.33.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.33.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.33.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.34.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.34.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.34.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.35.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.35.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.35.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.36.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.36.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.36.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.37.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.37.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.37.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.38.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.38.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.38.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.39.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.39.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.39.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.4.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.4.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.4.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.40.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.40.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.40.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.41.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.41.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.41.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.42.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.42.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.42.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.43.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.43.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.43.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.44.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.44.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.44.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.45.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.45.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.45.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.46.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.46.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.46.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.47.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.47.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.47.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.48.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.48.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.48.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.49.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.49.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.49.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.5.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.5.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.5.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.50.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.50.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.50.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.51.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.51.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.51.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.52.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.52.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.52.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.53.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.53.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.53.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.54.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.54.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.54.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.55.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.55.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.55.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.56.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.56.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.56.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.57.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.57.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.57.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.58.w1.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.58.w2.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.58.w3.weight": "consolidated-00217-of-00272.safetensors", + "layers.53.experts.59.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.59.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.59.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.6.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.6.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.6.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.60.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.60.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.60.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.61.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.61.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.61.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.62.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.62.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.62.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.63.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.63.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.63.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.64.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.64.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.64.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.65.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.65.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.65.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.66.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.66.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.66.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.67.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.67.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.67.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.68.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.68.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.68.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.69.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.69.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.69.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.7.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.7.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.7.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.70.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.70.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.70.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.71.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.71.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.71.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.72.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.72.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.72.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.73.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.73.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.73.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.74.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.74.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.74.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.75.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.75.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.75.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.76.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.76.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.76.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.77.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.77.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.77.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.78.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.78.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.78.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.79.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.79.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.79.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.8.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.8.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.8.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.80.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.80.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.80.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.81.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.81.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.81.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.82.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.82.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.82.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.83.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.83.w2.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.83.w3.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.84.w1.weight": "consolidated-00218-of-00272.safetensors", + "layers.53.experts.84.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.84.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.85.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.85.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.85.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.86.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.86.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.86.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.87.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.87.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.87.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.88.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.88.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.88.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.89.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.89.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.89.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.9.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.9.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.9.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.90.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.90.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.90.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.91.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.91.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.91.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.92.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.92.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.92.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.93.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.93.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.93.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.94.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.94.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.94.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.95.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.95.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.95.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.96.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.96.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.96.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.97.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.97.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.97.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.98.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.98.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.98.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.99.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.99.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.experts.99.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.ffn_norm.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.gate.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.shared_experts.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.shared_experts.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.53.shared_experts.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.attention.kv_a_norm.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.attention.q_a_norm.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.attention.wkv_a_with_mqa.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.attention.wkv_b.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.attention.wo.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.attention.wq_a.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.attention.wq_b.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.attention_norm.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.0.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.0.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.0.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.1.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.1.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.1.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.10.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.10.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.10.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.100.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.100.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.100.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.101.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.101.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.101.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.102.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.102.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.102.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.103.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.103.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.103.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.104.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.104.w2.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.104.w3.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.105.w1.weight": "consolidated-00219-of-00272.safetensors", + "layers.54.experts.105.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.105.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.106.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.106.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.106.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.107.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.107.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.107.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.108.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.108.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.108.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.109.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.109.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.109.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.11.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.11.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.11.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.110.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.110.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.110.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.111.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.111.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.111.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.112.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.112.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.112.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.113.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.113.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.113.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.114.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.114.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.114.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.115.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.115.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.115.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.116.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.116.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.116.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.117.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.117.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.117.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.118.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.118.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.118.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.119.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.119.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.119.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.12.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.12.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.12.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.120.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.120.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.120.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.121.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.121.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.121.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.122.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.122.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.122.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.123.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.123.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.123.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.124.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.124.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.124.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.125.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.125.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.125.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.126.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.126.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.126.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.127.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.127.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.127.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.13.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.13.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.13.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.14.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.14.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.14.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.15.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.15.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.15.w3.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.16.w1.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.16.w2.weight": "consolidated-00220-of-00272.safetensors", + "layers.54.experts.16.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.17.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.17.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.17.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.18.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.18.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.18.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.19.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.19.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.19.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.2.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.2.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.2.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.20.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.20.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.20.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.21.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.21.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.21.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.22.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.22.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.22.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.23.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.23.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.23.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.24.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.24.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.24.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.25.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.25.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.25.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.26.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.26.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.26.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.27.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.27.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.27.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.28.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.28.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.28.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.29.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.29.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.29.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.3.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.3.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.3.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.30.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.30.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.30.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.31.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.31.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.31.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.32.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.32.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.32.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.33.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.33.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.33.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.34.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.34.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.34.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.35.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.35.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.35.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.36.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.36.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.36.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.37.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.37.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.37.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.38.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.38.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.38.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.39.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.39.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.39.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.4.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.4.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.4.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.40.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.40.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.40.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.41.w1.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.41.w2.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.41.w3.weight": "consolidated-00221-of-00272.safetensors", + "layers.54.experts.42.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.42.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.42.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.43.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.43.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.43.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.44.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.44.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.44.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.45.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.45.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.45.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.46.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.46.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.46.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.47.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.47.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.47.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.48.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.48.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.48.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.49.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.49.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.49.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.5.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.5.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.5.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.50.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.50.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.50.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.51.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.51.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.51.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.52.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.52.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.52.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.53.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.53.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.53.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.54.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.54.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.54.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.55.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.55.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.55.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.56.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.56.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.56.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.57.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.57.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.57.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.58.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.58.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.58.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.59.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.59.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.59.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.6.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.6.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.6.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.60.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.60.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.60.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.61.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.61.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.61.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.62.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.62.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.62.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.63.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.63.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.63.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.64.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.64.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.64.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.65.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.65.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.65.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.66.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.66.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.66.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.67.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.67.w2.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.67.w3.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.68.w1.weight": "consolidated-00222-of-00272.safetensors", + "layers.54.experts.68.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.68.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.69.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.69.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.69.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.7.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.7.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.7.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.70.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.70.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.70.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.71.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.71.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.71.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.72.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.72.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.72.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.73.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.73.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.73.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.74.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.74.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.74.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.75.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.75.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.75.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.76.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.76.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.76.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.77.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.77.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.77.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.78.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.78.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.78.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.79.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.79.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.79.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.8.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.8.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.8.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.80.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.80.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.80.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.81.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.81.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.81.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.82.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.82.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.82.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.83.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.83.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.83.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.84.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.84.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.84.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.85.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.85.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.85.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.86.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.86.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.86.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.87.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.87.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.87.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.88.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.88.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.88.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.89.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.89.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.89.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.9.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.9.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.9.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.90.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.90.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.90.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.91.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.91.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.91.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.92.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.92.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.92.w3.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.93.w1.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.93.w2.weight": "consolidated-00223-of-00272.safetensors", + "layers.54.experts.93.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.94.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.94.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.94.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.95.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.95.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.95.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.96.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.96.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.96.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.97.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.97.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.97.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.98.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.98.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.98.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.99.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.99.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.experts.99.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.ffn_norm.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.gate.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.shared_experts.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.shared_experts.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.54.shared_experts.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.attention.kv_a_norm.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.attention.q_a_norm.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.attention.wkv_a_with_mqa.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.attention.wkv_b.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.attention.wo.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.attention.wq_a.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.attention.wq_b.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.attention_norm.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.0.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.0.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.0.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.1.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.1.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.1.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.10.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.10.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.10.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.100.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.100.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.100.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.101.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.101.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.101.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.102.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.102.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.102.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.103.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.103.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.103.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.104.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.104.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.104.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.105.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.105.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.105.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.106.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.106.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.106.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.107.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.107.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.107.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.108.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.108.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.108.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.109.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.109.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.109.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.11.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.11.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.11.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.110.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.110.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.110.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.111.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.111.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.111.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.112.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.112.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.112.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.113.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.113.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.113.w3.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.114.w1.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.114.w2.weight": "consolidated-00224-of-00272.safetensors", + "layers.55.experts.114.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.115.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.115.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.115.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.116.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.116.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.116.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.117.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.117.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.117.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.118.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.118.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.118.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.119.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.119.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.119.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.12.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.12.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.12.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.120.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.120.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.120.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.121.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.121.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.121.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.122.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.122.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.122.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.123.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.123.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.123.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.124.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.124.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.124.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.125.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.125.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.125.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.126.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.126.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.126.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.127.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.127.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.127.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.13.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.13.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.13.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.14.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.14.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.14.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.15.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.15.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.15.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.16.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.16.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.16.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.17.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.17.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.17.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.18.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.18.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.18.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.19.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.19.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.19.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.2.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.2.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.2.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.20.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.20.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.20.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.21.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.21.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.21.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.22.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.22.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.22.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.23.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.23.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.23.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.24.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.24.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.24.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.25.w1.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.25.w2.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.25.w3.weight": "consolidated-00225-of-00272.safetensors", + "layers.55.experts.26.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.26.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.26.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.27.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.27.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.27.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.28.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.28.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.28.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.29.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.29.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.29.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.3.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.3.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.3.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.30.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.30.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.30.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.31.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.31.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.31.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.32.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.32.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.32.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.33.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.33.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.33.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.34.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.34.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.34.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.35.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.35.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.35.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.36.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.36.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.36.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.37.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.37.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.37.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.38.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.38.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.38.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.39.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.39.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.39.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.4.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.4.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.4.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.40.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.40.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.40.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.41.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.41.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.41.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.42.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.42.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.42.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.43.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.43.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.43.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.44.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.44.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.44.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.45.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.45.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.45.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.46.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.46.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.46.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.47.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.47.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.47.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.48.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.48.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.48.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.49.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.49.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.49.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.5.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.5.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.5.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.50.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.50.w2.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.50.w3.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.51.w1.weight": "consolidated-00226-of-00272.safetensors", + "layers.55.experts.51.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.51.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.52.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.52.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.52.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.53.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.53.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.53.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.54.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.54.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.54.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.55.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.55.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.55.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.56.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.56.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.56.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.57.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.57.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.57.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.58.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.58.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.58.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.59.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.59.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.59.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.6.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.6.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.6.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.60.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.60.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.60.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.61.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.61.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.61.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.62.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.62.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.62.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.63.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.63.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.63.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.64.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.64.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.64.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.65.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.65.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.65.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.66.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.66.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.66.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.67.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.67.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.67.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.68.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.68.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.68.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.69.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.69.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.69.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.7.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.7.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.7.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.70.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.70.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.70.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.71.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.71.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.71.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.72.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.72.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.72.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.73.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.73.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.73.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.74.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.74.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.74.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.75.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.75.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.75.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.76.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.76.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.76.w3.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.77.w1.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.77.w2.weight": "consolidated-00227-of-00272.safetensors", + "layers.55.experts.77.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.78.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.78.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.78.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.79.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.79.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.79.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.8.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.8.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.8.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.80.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.80.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.80.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.81.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.81.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.81.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.82.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.82.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.82.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.83.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.83.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.83.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.84.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.84.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.84.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.85.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.85.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.85.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.86.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.86.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.86.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.87.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.87.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.87.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.88.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.88.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.88.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.89.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.89.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.89.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.9.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.9.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.9.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.90.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.90.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.90.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.91.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.91.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.91.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.92.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.92.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.92.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.93.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.93.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.93.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.94.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.94.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.94.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.95.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.95.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.95.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.96.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.96.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.96.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.97.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.97.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.97.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.98.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.98.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.98.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.99.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.99.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.experts.99.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.ffn_norm.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.gate.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.shared_experts.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.shared_experts.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.55.shared_experts.w3.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.attention.kv_a_norm.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.attention.q_a_norm.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.attention.wkv_a_with_mqa.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.attention.wkv_b.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.attention.wo.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.attention.wq_a.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.attention.wq_b.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.attention_norm.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.experts.0.w1.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.experts.0.w2.weight": "consolidated-00228-of-00272.safetensors", + "layers.56.experts.0.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.1.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.1.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.1.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.10.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.10.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.10.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.100.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.100.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.100.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.101.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.101.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.101.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.102.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.102.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.102.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.103.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.103.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.103.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.104.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.104.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.104.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.105.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.105.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.105.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.106.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.106.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.106.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.107.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.107.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.107.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.108.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.108.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.108.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.109.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.109.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.109.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.11.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.11.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.11.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.110.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.110.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.110.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.111.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.111.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.111.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.112.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.112.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.112.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.113.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.113.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.113.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.114.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.114.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.114.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.115.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.115.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.115.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.116.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.116.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.116.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.117.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.117.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.117.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.118.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.118.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.118.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.119.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.119.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.119.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.12.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.12.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.12.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.120.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.120.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.120.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.121.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.121.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.121.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.122.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.122.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.122.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.123.w1.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.123.w2.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.123.w3.weight": "consolidated-00229-of-00272.safetensors", + "layers.56.experts.124.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.124.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.124.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.125.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.125.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.125.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.126.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.126.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.126.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.127.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.127.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.127.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.13.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.13.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.13.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.14.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.14.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.14.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.15.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.15.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.15.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.16.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.16.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.16.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.17.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.17.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.17.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.18.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.18.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.18.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.19.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.19.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.19.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.2.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.2.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.2.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.20.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.20.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.20.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.21.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.21.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.21.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.22.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.22.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.22.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.23.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.23.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.23.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.24.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.24.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.24.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.25.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.25.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.25.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.26.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.26.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.26.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.27.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.27.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.27.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.28.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.28.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.28.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.29.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.29.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.29.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.3.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.3.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.3.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.30.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.30.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.30.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.31.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.31.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.31.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.32.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.32.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.32.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.33.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.33.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.33.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.34.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.34.w2.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.34.w3.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.35.w1.weight": "consolidated-00230-of-00272.safetensors", + "layers.56.experts.35.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.35.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.36.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.36.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.36.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.37.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.37.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.37.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.38.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.38.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.38.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.39.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.39.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.39.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.4.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.4.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.4.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.40.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.40.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.40.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.41.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.41.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.41.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.42.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.42.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.42.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.43.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.43.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.43.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.44.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.44.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.44.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.45.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.45.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.45.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.46.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.46.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.46.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.47.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.47.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.47.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.48.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.48.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.48.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.49.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.49.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.49.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.5.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.5.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.5.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.50.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.50.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.50.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.51.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.51.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.51.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.52.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.52.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.52.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.53.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.53.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.53.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.54.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.54.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.54.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.55.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.55.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.55.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.56.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.56.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.56.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.57.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.57.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.57.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.58.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.58.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.58.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.59.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.59.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.59.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.6.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.6.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.6.w3.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.60.w1.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.60.w2.weight": "consolidated-00231-of-00272.safetensors", + "layers.56.experts.60.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.61.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.61.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.61.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.62.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.62.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.62.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.63.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.63.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.63.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.64.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.64.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.64.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.65.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.65.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.65.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.66.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.66.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.66.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.67.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.67.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.67.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.68.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.68.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.68.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.69.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.69.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.69.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.7.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.7.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.7.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.70.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.70.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.70.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.71.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.71.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.71.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.72.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.72.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.72.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.73.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.73.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.73.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.74.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.74.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.74.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.75.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.75.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.75.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.76.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.76.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.76.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.77.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.77.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.77.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.78.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.78.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.78.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.79.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.79.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.79.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.8.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.8.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.8.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.80.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.80.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.80.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.81.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.81.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.81.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.82.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.82.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.82.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.83.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.83.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.83.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.84.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.84.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.84.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.85.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.85.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.85.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.86.w1.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.86.w2.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.86.w3.weight": "consolidated-00232-of-00272.safetensors", + "layers.56.experts.87.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.87.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.87.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.88.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.88.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.88.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.89.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.89.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.89.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.9.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.9.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.9.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.90.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.90.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.90.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.91.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.91.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.91.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.92.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.92.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.92.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.93.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.93.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.93.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.94.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.94.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.94.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.95.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.95.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.95.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.96.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.96.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.96.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.97.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.97.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.97.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.98.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.98.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.98.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.99.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.99.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.experts.99.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.ffn_norm.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.gate.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.shared_experts.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.shared_experts.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.56.shared_experts.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.attention.kv_a_norm.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.attention.q_a_norm.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.attention.wkv_a_with_mqa.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.attention.wkv_b.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.attention.wo.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.attention.wq_a.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.attention.wq_b.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.attention_norm.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.0.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.0.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.0.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.1.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.1.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.1.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.10.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.10.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.10.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.100.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.100.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.100.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.101.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.101.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.101.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.102.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.102.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.102.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.103.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.103.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.103.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.104.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.104.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.104.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.105.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.105.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.105.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.106.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.106.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.106.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.107.w1.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.107.w2.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.107.w3.weight": "consolidated-00233-of-00272.safetensors", + "layers.57.experts.108.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.108.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.108.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.109.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.109.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.109.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.11.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.11.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.11.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.110.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.110.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.110.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.111.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.111.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.111.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.112.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.112.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.112.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.113.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.113.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.113.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.114.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.114.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.114.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.115.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.115.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.115.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.116.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.116.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.116.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.117.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.117.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.117.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.118.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.118.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.118.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.119.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.119.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.119.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.12.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.12.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.12.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.120.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.120.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.120.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.121.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.121.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.121.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.122.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.122.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.122.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.123.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.123.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.123.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.124.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.124.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.124.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.125.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.125.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.125.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.126.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.126.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.126.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.127.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.127.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.127.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.13.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.13.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.13.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.14.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.14.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.14.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.15.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.15.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.15.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.16.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.16.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.16.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.17.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.17.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.17.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.18.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.18.w2.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.18.w3.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.19.w1.weight": "consolidated-00234-of-00272.safetensors", + "layers.57.experts.19.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.19.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.2.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.2.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.2.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.20.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.20.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.20.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.21.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.21.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.21.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.22.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.22.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.22.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.23.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.23.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.23.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.24.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.24.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.24.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.25.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.25.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.25.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.26.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.26.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.26.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.27.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.27.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.27.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.28.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.28.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.28.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.29.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.29.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.29.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.3.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.3.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.3.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.30.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.30.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.30.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.31.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.31.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.31.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.32.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.32.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.32.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.33.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.33.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.33.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.34.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.34.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.34.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.35.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.35.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.35.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.36.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.36.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.36.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.37.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.37.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.37.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.38.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.38.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.38.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.39.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.39.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.39.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.4.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.4.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.4.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.40.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.40.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.40.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.41.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.41.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.41.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.42.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.42.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.42.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.43.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.43.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.43.w3.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.44.w1.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.44.w2.weight": "consolidated-00235-of-00272.safetensors", + "layers.57.experts.44.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.45.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.45.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.45.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.46.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.46.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.46.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.47.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.47.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.47.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.48.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.48.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.48.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.49.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.49.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.49.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.5.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.5.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.5.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.50.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.50.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.50.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.51.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.51.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.51.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.52.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.52.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.52.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.53.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.53.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.53.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.54.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.54.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.54.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.55.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.55.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.55.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.56.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.56.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.56.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.57.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.57.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.57.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.58.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.58.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.58.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.59.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.59.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.59.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.6.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.6.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.6.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.60.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.60.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.60.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.61.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.61.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.61.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.62.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.62.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.62.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.63.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.63.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.63.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.64.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.64.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.64.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.65.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.65.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.65.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.66.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.66.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.66.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.67.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.67.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.67.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.68.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.68.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.68.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.69.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.69.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.69.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.7.w1.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.7.w2.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.7.w3.weight": "consolidated-00236-of-00272.safetensors", + "layers.57.experts.70.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.70.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.70.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.71.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.71.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.71.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.72.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.72.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.72.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.73.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.73.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.73.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.74.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.74.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.74.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.75.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.75.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.75.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.76.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.76.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.76.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.77.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.77.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.77.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.78.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.78.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.78.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.79.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.79.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.79.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.8.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.8.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.8.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.80.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.80.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.80.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.81.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.81.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.81.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.82.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.82.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.82.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.83.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.83.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.83.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.84.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.84.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.84.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.85.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.85.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.85.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.86.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.86.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.86.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.87.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.87.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.87.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.88.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.88.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.88.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.89.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.89.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.89.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.9.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.9.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.9.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.90.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.90.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.90.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.91.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.91.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.91.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.92.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.92.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.92.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.93.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.93.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.93.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.94.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.94.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.94.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.95.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.95.w2.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.95.w3.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.96.w1.weight": "consolidated-00237-of-00272.safetensors", + "layers.57.experts.96.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.96.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.97.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.97.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.97.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.98.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.98.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.98.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.99.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.99.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.experts.99.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.ffn_norm.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.gate.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.shared_experts.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.shared_experts.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.57.shared_experts.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.attention.kv_a_norm.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.attention.q_a_norm.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.attention.wkv_a_with_mqa.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.attention.wkv_b.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.attention.wo.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.attention.wq_a.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.attention.wq_b.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.attention_norm.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.0.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.0.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.0.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.1.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.1.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.1.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.10.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.10.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.10.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.100.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.100.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.100.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.101.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.101.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.101.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.102.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.102.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.102.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.103.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.103.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.103.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.104.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.104.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.104.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.105.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.105.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.105.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.106.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.106.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.106.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.107.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.107.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.107.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.108.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.108.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.108.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.109.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.109.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.109.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.11.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.11.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.11.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.110.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.110.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.110.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.111.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.111.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.111.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.112.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.112.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.112.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.113.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.113.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.113.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.114.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.114.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.114.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.115.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.115.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.115.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.116.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.116.w2.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.116.w3.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.117.w1.weight": "consolidated-00238-of-00272.safetensors", + "layers.58.experts.117.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.117.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.118.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.118.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.118.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.119.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.119.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.119.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.12.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.12.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.12.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.120.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.120.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.120.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.121.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.121.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.121.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.122.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.122.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.122.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.123.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.123.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.123.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.124.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.124.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.124.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.125.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.125.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.125.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.126.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.126.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.126.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.127.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.127.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.127.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.13.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.13.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.13.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.14.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.14.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.14.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.15.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.15.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.15.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.16.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.16.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.16.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.17.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.17.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.17.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.18.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.18.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.18.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.19.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.19.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.19.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.2.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.2.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.2.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.20.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.20.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.20.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.21.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.21.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.21.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.22.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.22.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.22.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.23.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.23.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.23.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.24.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.24.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.24.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.25.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.25.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.25.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.26.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.26.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.26.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.27.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.27.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.27.w3.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.28.w1.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.28.w2.weight": "consolidated-00239-of-00272.safetensors", + "layers.58.experts.28.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.29.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.29.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.29.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.3.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.3.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.3.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.30.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.30.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.30.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.31.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.31.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.31.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.32.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.32.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.32.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.33.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.33.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.33.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.34.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.34.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.34.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.35.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.35.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.35.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.36.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.36.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.36.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.37.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.37.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.37.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.38.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.38.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.38.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.39.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.39.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.39.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.4.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.4.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.4.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.40.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.40.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.40.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.41.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.41.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.41.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.42.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.42.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.42.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.43.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.43.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.43.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.44.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.44.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.44.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.45.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.45.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.45.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.46.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.46.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.46.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.47.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.47.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.47.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.48.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.48.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.48.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.49.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.49.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.49.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.5.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.5.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.5.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.50.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.50.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.50.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.51.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.51.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.51.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.52.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.52.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.52.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.53.w1.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.53.w2.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.53.w3.weight": "consolidated-00240-of-00272.safetensors", + "layers.58.experts.54.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.54.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.54.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.55.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.55.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.55.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.56.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.56.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.56.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.57.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.57.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.57.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.58.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.58.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.58.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.59.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.59.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.59.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.6.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.6.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.6.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.60.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.60.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.60.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.61.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.61.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.61.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.62.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.62.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.62.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.63.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.63.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.63.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.64.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.64.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.64.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.65.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.65.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.65.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.66.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.66.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.66.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.67.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.67.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.67.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.68.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.68.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.68.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.69.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.69.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.69.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.7.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.7.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.7.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.70.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.70.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.70.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.71.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.71.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.71.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.72.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.72.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.72.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.73.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.73.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.73.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.74.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.74.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.74.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.75.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.75.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.75.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.76.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.76.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.76.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.77.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.77.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.77.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.78.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.78.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.78.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.79.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.79.w2.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.79.w3.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.8.w1.weight": "consolidated-00241-of-00272.safetensors", + "layers.58.experts.8.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.8.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.80.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.80.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.80.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.81.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.81.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.81.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.82.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.82.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.82.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.83.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.83.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.83.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.84.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.84.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.84.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.85.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.85.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.85.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.86.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.86.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.86.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.87.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.87.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.87.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.88.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.88.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.88.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.89.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.89.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.89.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.9.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.9.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.9.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.90.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.90.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.90.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.91.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.91.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.91.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.92.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.92.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.92.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.93.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.93.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.93.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.94.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.94.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.94.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.95.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.95.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.95.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.96.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.96.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.96.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.97.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.97.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.97.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.98.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.98.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.98.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.99.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.99.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.experts.99.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.ffn_norm.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.gate.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.shared_experts.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.shared_experts.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.58.shared_experts.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.attention.kv_a_norm.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.attention.q_a_norm.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.attention.wkv_a_with_mqa.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.attention.wkv_b.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.attention.wo.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.attention.wq_a.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.attention.wq_b.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.attention_norm.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.0.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.0.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.0.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.1.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.1.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.1.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.10.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.10.w2.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.10.w3.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.100.w1.weight": "consolidated-00242-of-00272.safetensors", + "layers.59.experts.100.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.100.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.101.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.101.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.101.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.102.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.102.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.102.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.103.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.103.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.103.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.104.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.104.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.104.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.105.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.105.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.105.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.106.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.106.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.106.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.107.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.107.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.107.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.108.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.108.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.108.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.109.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.109.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.109.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.11.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.11.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.11.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.110.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.110.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.110.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.111.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.111.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.111.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.112.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.112.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.112.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.113.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.113.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.113.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.114.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.114.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.114.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.115.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.115.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.115.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.116.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.116.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.116.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.117.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.117.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.117.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.118.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.118.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.118.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.119.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.119.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.119.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.12.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.12.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.12.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.120.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.120.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.120.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.121.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.121.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.121.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.122.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.122.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.122.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.123.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.123.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.123.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.124.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.124.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.124.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.125.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.125.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.125.w3.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.126.w1.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.126.w2.weight": "consolidated-00243-of-00272.safetensors", + "layers.59.experts.126.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.127.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.127.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.127.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.13.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.13.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.13.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.14.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.14.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.14.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.15.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.15.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.15.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.16.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.16.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.16.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.17.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.17.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.17.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.18.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.18.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.18.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.19.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.19.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.19.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.2.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.2.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.2.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.20.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.20.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.20.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.21.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.21.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.21.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.22.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.22.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.22.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.23.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.23.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.23.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.24.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.24.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.24.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.25.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.25.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.25.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.26.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.26.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.26.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.27.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.27.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.27.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.28.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.28.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.28.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.29.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.29.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.29.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.3.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.3.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.3.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.30.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.30.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.30.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.31.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.31.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.31.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.32.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.32.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.32.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.33.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.33.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.33.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.34.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.34.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.34.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.35.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.35.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.35.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.36.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.36.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.36.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.37.w1.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.37.w2.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.37.w3.weight": "consolidated-00244-of-00272.safetensors", + "layers.59.experts.38.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.38.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.38.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.39.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.39.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.39.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.4.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.4.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.4.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.40.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.40.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.40.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.41.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.41.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.41.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.42.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.42.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.42.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.43.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.43.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.43.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.44.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.44.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.44.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.45.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.45.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.45.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.46.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.46.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.46.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.47.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.47.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.47.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.48.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.48.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.48.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.49.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.49.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.49.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.5.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.5.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.5.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.50.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.50.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.50.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.51.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.51.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.51.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.52.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.52.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.52.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.53.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.53.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.53.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.54.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.54.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.54.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.55.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.55.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.55.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.56.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.56.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.56.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.57.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.57.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.57.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.58.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.58.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.58.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.59.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.59.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.59.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.6.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.6.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.6.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.60.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.60.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.60.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.61.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.61.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.61.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.62.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.62.w2.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.62.w3.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.63.w1.weight": "consolidated-00245-of-00272.safetensors", + "layers.59.experts.63.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.63.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.64.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.64.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.64.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.65.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.65.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.65.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.66.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.66.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.66.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.67.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.67.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.67.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.68.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.68.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.68.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.69.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.69.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.69.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.7.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.7.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.7.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.70.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.70.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.70.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.71.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.71.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.71.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.72.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.72.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.72.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.73.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.73.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.73.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.74.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.74.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.74.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.75.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.75.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.75.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.76.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.76.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.76.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.77.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.77.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.77.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.78.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.78.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.78.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.79.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.79.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.79.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.8.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.8.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.8.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.80.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.80.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.80.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.81.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.81.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.81.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.82.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.82.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.82.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.83.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.83.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.83.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.84.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.84.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.84.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.85.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.85.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.85.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.86.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.86.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.86.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.87.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.87.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.87.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.88.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.88.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.88.w3.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.89.w1.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.89.w2.weight": "consolidated-00246-of-00272.safetensors", + "layers.59.experts.89.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.9.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.9.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.9.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.90.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.90.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.90.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.91.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.91.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.91.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.92.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.92.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.92.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.93.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.93.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.93.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.94.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.94.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.94.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.95.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.95.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.95.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.96.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.96.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.96.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.97.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.97.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.97.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.98.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.98.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.98.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.99.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.99.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.experts.99.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.ffn_norm.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.gate.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.shared_experts.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.shared_experts.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.59.shared_experts.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.attention.kv_a_norm.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.attention.q_a_norm.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.attention.wkv_a_with_mqa.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.attention.wkv_b.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.attention.wo.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.attention.wq_a.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.attention.wq_b.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.attention_norm.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.0.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.0.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.0.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.1.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.1.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.1.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.10.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.10.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.10.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.100.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.100.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.100.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.101.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.101.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.101.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.102.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.102.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.102.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.103.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.103.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.103.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.104.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.104.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.104.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.105.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.105.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.105.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.106.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.106.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.106.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.107.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.107.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.107.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.108.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.108.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.108.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.109.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.109.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.109.w3.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.11.w1.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.11.w2.weight": "consolidated-00247-of-00272.safetensors", + "layers.6.experts.11.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.110.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.110.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.110.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.111.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.111.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.111.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.112.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.112.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.112.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.113.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.113.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.113.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.114.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.114.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.114.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.115.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.115.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.115.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.116.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.116.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.116.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.117.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.117.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.117.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.118.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.118.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.118.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.119.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.119.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.119.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.12.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.12.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.12.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.120.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.120.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.120.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.121.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.121.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.121.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.122.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.122.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.122.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.123.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.123.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.123.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.124.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.124.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.124.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.125.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.125.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.125.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.126.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.126.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.126.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.127.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.127.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.127.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.13.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.13.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.13.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.14.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.14.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.14.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.15.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.15.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.15.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.16.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.16.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.16.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.17.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.17.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.17.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.18.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.18.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.18.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.19.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.19.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.19.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.2.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.2.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.2.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.20.w1.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.20.w2.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.20.w3.weight": "consolidated-00248-of-00272.safetensors", + "layers.6.experts.21.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.21.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.21.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.22.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.22.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.22.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.23.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.23.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.23.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.24.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.24.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.24.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.25.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.25.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.25.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.26.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.26.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.26.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.27.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.27.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.27.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.28.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.28.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.28.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.29.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.29.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.29.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.3.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.3.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.3.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.30.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.30.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.30.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.31.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.31.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.31.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.32.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.32.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.32.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.33.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.33.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.33.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.34.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.34.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.34.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.35.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.35.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.35.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.36.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.36.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.36.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.37.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.37.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.37.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.38.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.38.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.38.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.39.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.39.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.39.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.4.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.4.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.4.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.40.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.40.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.40.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.41.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.41.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.41.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.42.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.42.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.42.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.43.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.43.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.43.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.44.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.44.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.44.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.45.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.45.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.45.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.46.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.46.w2.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.46.w3.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.47.w1.weight": "consolidated-00249-of-00272.safetensors", + "layers.6.experts.47.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.47.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.48.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.48.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.48.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.49.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.49.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.49.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.5.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.5.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.5.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.50.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.50.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.50.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.51.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.51.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.51.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.52.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.52.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.52.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.53.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.53.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.53.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.54.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.54.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.54.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.55.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.55.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.55.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.56.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.56.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.56.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.57.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.57.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.57.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.58.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.58.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.58.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.59.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.59.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.59.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.6.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.6.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.6.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.60.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.60.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.60.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.61.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.61.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.61.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.62.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.62.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.62.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.63.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.63.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.63.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.64.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.64.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.64.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.65.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.65.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.65.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.66.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.66.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.66.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.67.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.67.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.67.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.68.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.68.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.68.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.69.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.69.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.69.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.7.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.7.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.7.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.70.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.70.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.70.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.71.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.71.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.71.w3.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.72.w1.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.72.w2.weight": "consolidated-00250-of-00272.safetensors", + "layers.6.experts.72.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.73.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.73.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.73.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.74.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.74.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.74.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.75.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.75.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.75.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.76.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.76.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.76.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.77.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.77.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.77.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.78.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.78.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.78.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.79.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.79.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.79.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.8.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.8.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.8.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.80.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.80.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.80.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.81.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.81.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.81.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.82.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.82.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.82.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.83.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.83.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.83.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.84.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.84.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.84.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.85.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.85.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.85.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.86.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.86.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.86.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.87.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.87.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.87.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.88.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.88.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.88.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.89.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.89.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.89.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.9.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.9.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.9.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.90.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.90.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.90.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.91.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.91.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.91.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.92.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.92.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.92.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.93.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.93.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.93.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.94.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.94.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.94.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.95.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.95.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.95.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.96.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.96.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.96.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.97.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.97.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.97.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.98.w1.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.98.w2.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.98.w3.weight": "consolidated-00251-of-00272.safetensors", + "layers.6.experts.99.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.6.experts.99.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.6.experts.99.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.6.ffn_norm.weight": "consolidated-00252-of-00272.safetensors", + "layers.6.gate.weight": "consolidated-00252-of-00272.safetensors", + "layers.6.shared_experts.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.6.shared_experts.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.6.shared_experts.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.attention.kv_a_norm.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.attention.q_a_norm.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.attention.wkv_a_with_mqa.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.attention.wkv_b.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.attention.wo.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.attention.wq_a.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.attention.wq_b.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.attention_norm.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.0.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.0.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.0.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.1.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.1.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.1.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.10.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.10.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.10.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.100.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.100.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.100.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.101.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.101.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.101.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.102.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.102.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.102.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.103.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.103.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.103.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.104.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.104.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.104.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.105.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.105.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.105.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.106.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.106.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.106.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.107.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.107.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.107.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.108.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.108.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.108.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.109.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.109.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.109.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.11.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.11.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.11.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.110.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.110.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.110.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.111.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.111.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.111.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.112.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.112.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.112.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.113.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.113.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.113.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.114.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.114.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.114.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.115.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.115.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.115.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.116.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.116.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.116.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.117.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.117.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.117.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.118.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.118.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.118.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.119.w1.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.119.w2.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.119.w3.weight": "consolidated-00252-of-00272.safetensors", + "layers.60.experts.12.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.12.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.12.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.120.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.120.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.120.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.121.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.121.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.121.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.122.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.122.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.122.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.123.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.123.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.123.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.124.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.124.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.124.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.125.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.125.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.125.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.126.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.126.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.126.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.127.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.127.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.127.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.13.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.13.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.13.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.14.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.14.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.14.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.15.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.15.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.15.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.16.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.16.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.16.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.17.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.17.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.17.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.18.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.18.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.18.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.19.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.19.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.19.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.2.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.2.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.2.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.20.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.20.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.20.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.21.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.21.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.21.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.22.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.22.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.22.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.23.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.23.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.23.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.24.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.24.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.24.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.25.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.25.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.25.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.26.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.26.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.26.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.27.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.27.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.27.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.28.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.28.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.28.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.29.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.29.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.29.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.3.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.3.w2.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.3.w3.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.30.w1.weight": "consolidated-00253-of-00272.safetensors", + "layers.60.experts.30.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.30.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.31.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.31.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.31.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.32.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.32.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.32.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.33.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.33.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.33.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.34.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.34.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.34.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.35.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.35.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.35.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.36.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.36.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.36.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.37.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.37.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.37.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.38.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.38.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.38.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.39.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.39.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.39.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.4.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.4.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.4.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.40.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.40.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.40.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.41.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.41.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.41.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.42.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.42.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.42.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.43.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.43.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.43.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.44.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.44.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.44.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.45.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.45.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.45.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.46.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.46.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.46.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.47.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.47.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.47.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.48.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.48.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.48.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.49.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.49.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.49.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.5.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.5.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.5.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.50.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.50.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.50.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.51.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.51.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.51.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.52.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.52.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.52.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.53.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.53.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.53.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.54.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.54.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.54.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.55.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.55.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.55.w3.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.56.w1.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.56.w2.weight": "consolidated-00254-of-00272.safetensors", + "layers.60.experts.56.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.57.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.57.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.57.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.58.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.58.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.58.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.59.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.59.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.59.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.6.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.6.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.6.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.60.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.60.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.60.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.61.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.61.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.61.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.62.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.62.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.62.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.63.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.63.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.63.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.64.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.64.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.64.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.65.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.65.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.65.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.66.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.66.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.66.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.67.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.67.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.67.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.68.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.68.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.68.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.69.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.69.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.69.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.7.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.7.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.7.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.70.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.70.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.70.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.71.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.71.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.71.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.72.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.72.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.72.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.73.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.73.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.73.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.74.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.74.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.74.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.75.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.75.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.75.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.76.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.76.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.76.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.77.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.77.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.77.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.78.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.78.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.78.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.79.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.79.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.79.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.8.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.8.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.8.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.80.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.80.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.80.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.81.w1.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.81.w2.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.81.w3.weight": "consolidated-00255-of-00272.safetensors", + "layers.60.experts.82.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.82.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.82.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.83.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.83.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.83.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.84.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.84.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.84.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.85.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.85.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.85.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.86.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.86.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.86.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.87.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.87.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.87.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.88.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.88.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.88.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.89.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.89.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.89.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.9.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.9.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.9.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.90.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.90.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.90.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.91.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.91.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.91.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.92.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.92.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.92.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.93.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.93.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.93.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.94.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.94.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.94.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.95.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.95.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.95.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.96.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.96.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.96.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.97.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.97.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.97.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.98.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.98.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.98.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.99.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.99.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.experts.99.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.ffn_norm.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.gate.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.shared_experts.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.shared_experts.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.60.shared_experts.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.attention.kv_a_norm.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.attention.q_a_norm.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.attention.wkv_a_with_mqa.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.attention.wkv_b.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.attention.wo.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.attention.wq_a.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.attention.wq_b.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.attention_norm.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.0.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.0.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.0.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.1.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.1.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.1.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.10.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.10.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.10.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.100.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.100.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.100.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.101.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.101.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.101.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.102.w1.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.102.w2.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.102.w3.weight": "consolidated-00256-of-00272.safetensors", + "layers.7.experts.103.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.103.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.103.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.104.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.104.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.104.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.105.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.105.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.105.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.106.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.106.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.106.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.107.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.107.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.107.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.108.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.108.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.108.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.109.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.109.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.109.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.11.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.11.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.11.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.110.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.110.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.110.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.111.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.111.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.111.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.112.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.112.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.112.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.113.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.113.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.113.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.114.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.114.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.114.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.115.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.115.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.115.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.116.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.116.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.116.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.117.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.117.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.117.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.118.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.118.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.118.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.119.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.119.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.119.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.12.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.12.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.12.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.120.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.120.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.120.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.121.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.121.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.121.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.122.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.122.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.122.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.123.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.123.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.123.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.124.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.124.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.124.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.125.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.125.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.125.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.126.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.126.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.126.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.127.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.127.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.127.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.13.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.13.w2.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.13.w3.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.14.w1.weight": "consolidated-00257-of-00272.safetensors", + "layers.7.experts.14.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.14.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.15.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.15.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.15.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.16.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.16.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.16.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.17.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.17.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.17.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.18.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.18.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.18.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.19.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.19.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.19.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.2.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.2.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.2.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.20.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.20.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.20.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.21.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.21.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.21.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.22.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.22.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.22.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.23.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.23.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.23.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.24.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.24.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.24.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.25.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.25.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.25.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.26.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.26.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.26.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.27.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.27.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.27.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.28.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.28.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.28.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.29.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.29.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.29.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.3.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.3.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.3.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.30.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.30.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.30.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.31.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.31.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.31.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.32.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.32.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.32.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.33.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.33.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.33.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.34.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.34.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.34.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.35.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.35.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.35.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.36.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.36.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.36.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.37.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.37.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.37.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.38.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.38.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.38.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.39.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.39.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.39.w3.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.4.w1.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.4.w2.weight": "consolidated-00258-of-00272.safetensors", + "layers.7.experts.4.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.40.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.40.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.40.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.41.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.41.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.41.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.42.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.42.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.42.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.43.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.43.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.43.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.44.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.44.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.44.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.45.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.45.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.45.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.46.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.46.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.46.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.47.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.47.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.47.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.48.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.48.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.48.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.49.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.49.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.49.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.5.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.5.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.5.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.50.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.50.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.50.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.51.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.51.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.51.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.52.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.52.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.52.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.53.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.53.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.53.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.54.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.54.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.54.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.55.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.55.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.55.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.56.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.56.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.56.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.57.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.57.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.57.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.58.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.58.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.58.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.59.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.59.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.59.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.6.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.6.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.6.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.60.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.60.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.60.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.61.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.61.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.61.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.62.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.62.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.62.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.63.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.63.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.63.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.64.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.64.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.64.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.65.w1.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.65.w2.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.65.w3.weight": "consolidated-00259-of-00272.safetensors", + "layers.7.experts.66.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.66.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.66.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.67.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.67.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.67.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.68.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.68.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.68.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.69.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.69.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.69.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.7.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.7.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.7.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.70.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.70.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.70.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.71.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.71.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.71.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.72.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.72.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.72.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.73.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.73.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.73.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.74.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.74.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.74.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.75.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.75.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.75.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.76.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.76.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.76.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.77.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.77.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.77.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.78.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.78.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.78.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.79.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.79.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.79.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.8.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.8.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.8.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.80.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.80.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.80.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.81.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.81.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.81.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.82.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.82.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.82.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.83.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.83.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.83.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.84.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.84.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.84.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.85.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.85.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.85.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.86.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.86.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.86.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.87.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.87.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.87.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.88.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.88.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.88.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.89.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.89.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.89.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.9.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.9.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.9.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.90.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.90.w2.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.90.w3.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.91.w1.weight": "consolidated-00260-of-00272.safetensors", + "layers.7.experts.91.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.91.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.92.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.92.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.92.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.93.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.93.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.93.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.94.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.94.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.94.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.95.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.95.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.95.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.96.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.96.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.96.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.97.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.97.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.97.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.98.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.98.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.98.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.99.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.99.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.experts.99.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.ffn_norm.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.gate.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.shared_experts.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.shared_experts.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.7.shared_experts.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.attention.kv_a_norm.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.attention.q_a_norm.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.attention.wkv_a_with_mqa.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.attention.wkv_b.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.attention.wo.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.attention.wq_a.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.attention.wq_b.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.attention_norm.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.0.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.0.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.0.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.1.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.1.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.1.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.10.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.10.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.10.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.100.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.100.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.100.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.101.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.101.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.101.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.102.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.102.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.102.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.103.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.103.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.103.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.104.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.104.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.104.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.105.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.105.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.105.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.106.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.106.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.106.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.107.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.107.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.107.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.108.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.108.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.108.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.109.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.109.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.109.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.11.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.11.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.11.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.110.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.110.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.110.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.111.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.111.w2.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.111.w3.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.112.w1.weight": "consolidated-00261-of-00272.safetensors", + "layers.8.experts.112.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.112.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.113.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.113.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.113.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.114.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.114.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.114.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.115.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.115.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.115.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.116.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.116.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.116.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.117.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.117.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.117.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.118.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.118.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.118.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.119.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.119.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.119.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.12.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.12.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.12.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.120.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.120.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.120.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.121.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.121.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.121.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.122.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.122.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.122.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.123.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.123.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.123.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.124.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.124.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.124.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.125.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.125.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.125.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.126.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.126.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.126.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.127.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.127.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.127.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.13.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.13.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.13.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.14.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.14.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.14.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.15.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.15.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.15.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.16.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.16.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.16.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.17.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.17.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.17.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.18.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.18.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.18.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.19.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.19.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.19.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.2.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.2.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.2.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.20.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.20.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.20.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.21.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.21.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.21.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.22.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.22.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.22.w3.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.23.w1.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.23.w2.weight": "consolidated-00262-of-00272.safetensors", + "layers.8.experts.23.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.24.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.24.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.24.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.25.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.25.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.25.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.26.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.26.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.26.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.27.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.27.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.27.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.28.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.28.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.28.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.29.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.29.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.29.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.3.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.3.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.3.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.30.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.30.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.30.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.31.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.31.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.31.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.32.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.32.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.32.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.33.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.33.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.33.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.34.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.34.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.34.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.35.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.35.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.35.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.36.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.36.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.36.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.37.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.37.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.37.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.38.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.38.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.38.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.39.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.39.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.39.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.4.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.4.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.4.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.40.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.40.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.40.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.41.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.41.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.41.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.42.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.42.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.42.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.43.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.43.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.43.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.44.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.44.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.44.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.45.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.45.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.45.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.46.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.46.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.46.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.47.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.47.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.47.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.48.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.48.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.48.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.49.w1.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.49.w2.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.49.w3.weight": "consolidated-00263-of-00272.safetensors", + "layers.8.experts.5.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.5.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.5.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.50.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.50.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.50.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.51.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.51.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.51.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.52.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.52.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.52.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.53.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.53.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.53.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.54.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.54.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.54.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.55.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.55.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.55.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.56.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.56.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.56.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.57.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.57.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.57.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.58.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.58.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.58.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.59.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.59.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.59.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.6.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.6.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.6.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.60.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.60.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.60.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.61.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.61.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.61.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.62.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.62.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.62.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.63.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.63.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.63.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.64.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.64.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.64.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.65.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.65.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.65.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.66.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.66.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.66.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.67.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.67.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.67.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.68.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.68.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.68.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.69.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.69.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.69.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.7.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.7.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.7.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.70.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.70.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.70.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.71.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.71.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.71.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.72.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.72.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.72.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.73.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.73.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.73.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.74.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.74.w2.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.74.w3.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.75.w1.weight": "consolidated-00264-of-00272.safetensors", + "layers.8.experts.75.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.75.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.76.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.76.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.76.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.77.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.77.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.77.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.78.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.78.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.78.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.79.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.79.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.79.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.8.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.8.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.8.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.80.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.80.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.80.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.81.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.81.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.81.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.82.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.82.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.82.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.83.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.83.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.83.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.84.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.84.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.84.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.85.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.85.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.85.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.86.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.86.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.86.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.87.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.87.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.87.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.88.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.88.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.88.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.89.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.89.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.89.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.9.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.9.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.9.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.90.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.90.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.90.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.91.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.91.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.91.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.92.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.92.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.92.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.93.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.93.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.93.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.94.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.94.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.94.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.95.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.95.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.95.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.96.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.96.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.96.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.97.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.97.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.97.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.98.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.98.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.98.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.99.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.99.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.experts.99.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.ffn_norm.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.gate.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.shared_experts.w1.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.shared_experts.w2.weight": "consolidated-00265-of-00272.safetensors", + "layers.8.shared_experts.w3.weight": "consolidated-00265-of-00272.safetensors", + "layers.9.attention.kv_a_norm.weight": "consolidated-00265-of-00272.safetensors", + "layers.9.attention.q_a_norm.weight": "consolidated-00265-of-00272.safetensors", + "layers.9.attention.wkv_a_with_mqa.weight": "consolidated-00265-of-00272.safetensors", + "layers.9.attention.wkv_b.weight": "consolidated-00265-of-00272.safetensors", + "layers.9.attention.wo.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.attention.wq_a.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.attention.wq_b.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.attention_norm.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.0.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.0.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.0.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.1.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.1.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.1.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.10.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.10.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.10.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.100.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.100.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.100.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.101.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.101.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.101.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.102.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.102.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.102.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.103.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.103.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.103.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.104.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.104.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.104.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.105.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.105.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.105.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.106.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.106.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.106.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.107.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.107.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.107.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.108.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.108.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.108.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.109.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.109.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.109.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.11.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.11.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.11.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.110.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.110.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.110.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.111.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.111.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.111.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.112.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.112.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.112.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.113.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.113.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.113.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.114.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.114.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.114.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.115.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.115.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.115.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.116.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.116.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.116.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.117.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.117.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.117.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.118.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.118.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.118.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.119.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.119.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.119.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.12.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.12.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.12.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.120.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.120.w2.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.120.w3.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.121.w1.weight": "consolidated-00266-of-00272.safetensors", + "layers.9.experts.121.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.121.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.122.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.122.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.122.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.123.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.123.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.123.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.124.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.124.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.124.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.125.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.125.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.125.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.126.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.126.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.126.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.127.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.127.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.127.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.13.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.13.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.13.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.14.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.14.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.14.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.15.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.15.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.15.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.16.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.16.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.16.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.17.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.17.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.17.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.18.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.18.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.18.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.19.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.19.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.19.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.2.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.2.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.2.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.20.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.20.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.20.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.21.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.21.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.21.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.22.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.22.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.22.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.23.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.23.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.23.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.24.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.24.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.24.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.25.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.25.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.25.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.26.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.26.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.26.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.27.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.27.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.27.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.28.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.28.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.28.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.29.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.29.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.29.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.3.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.3.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.3.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.30.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.30.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.30.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.31.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.31.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.31.w3.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.32.w1.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.32.w2.weight": "consolidated-00267-of-00272.safetensors", + "layers.9.experts.32.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.33.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.33.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.33.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.34.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.34.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.34.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.35.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.35.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.35.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.36.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.36.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.36.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.37.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.37.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.37.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.38.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.38.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.38.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.39.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.39.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.39.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.4.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.4.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.4.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.40.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.40.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.40.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.41.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.41.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.41.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.42.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.42.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.42.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.43.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.43.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.43.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.44.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.44.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.44.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.45.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.45.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.45.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.46.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.46.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.46.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.47.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.47.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.47.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.48.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.48.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.48.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.49.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.49.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.49.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.5.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.5.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.5.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.50.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.50.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.50.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.51.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.51.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.51.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.52.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.52.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.52.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.53.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.53.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.53.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.54.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.54.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.54.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.55.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.55.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.55.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.56.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.56.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.56.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.57.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.57.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.57.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.58.w1.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.58.w2.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.58.w3.weight": "consolidated-00268-of-00272.safetensors", + "layers.9.experts.59.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.59.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.59.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.6.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.6.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.6.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.60.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.60.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.60.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.61.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.61.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.61.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.62.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.62.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.62.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.63.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.63.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.63.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.64.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.64.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.64.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.65.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.65.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.65.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.66.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.66.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.66.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.67.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.67.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.67.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.68.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.68.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.68.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.69.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.69.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.69.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.7.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.7.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.7.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.70.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.70.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.70.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.71.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.71.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.71.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.72.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.72.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.72.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.73.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.73.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.73.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.74.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.74.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.74.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.75.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.75.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.75.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.76.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.76.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.76.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.77.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.77.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.77.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.78.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.78.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.78.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.79.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.79.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.79.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.8.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.8.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.8.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.80.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.80.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.80.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.81.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.81.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.81.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.82.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.82.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.82.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.83.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.83.w2.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.83.w3.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.84.w1.weight": "consolidated-00269-of-00272.safetensors", + "layers.9.experts.84.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.84.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.85.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.85.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.85.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.86.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.86.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.86.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.87.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.87.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.87.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.88.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.88.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.88.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.89.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.89.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.89.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.9.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.9.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.9.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.90.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.90.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.90.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.91.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.91.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.91.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.92.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.92.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.92.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.93.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.93.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.93.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.94.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.94.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.94.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.95.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.95.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.95.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.96.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.96.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.96.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.97.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.97.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.97.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.98.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.98.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.98.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.99.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.99.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.experts.99.w3.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.ffn_norm.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.gate.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.shared_experts.w1.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.shared_experts.w2.weight": "consolidated-00270-of-00272.safetensors", + "layers.9.shared_experts.w3.weight": "consolidated-00270-of-00272.safetensors", + "patch_merger.merging_layer.weight": "consolidated-00270-of-00272.safetensors", + "pre_mm_projector_norm.weight": "consolidated-00270-of-00272.safetensors", + "tok_embeddings.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.ln_pre.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.patch_conv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.0.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.0.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.0.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.0.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.0.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.0.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.0.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.0.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.0.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.1.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.1.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.1.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.1.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.1.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.1.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.1.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.1.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.1.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.10.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.10.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.10.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.10.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.10.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.10.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.10.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.10.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.10.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.11.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.11.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.11.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.11.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.11.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.11.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.11.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.11.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.11.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.12.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.12.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.12.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.12.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.12.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.12.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.12.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.12.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.12.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.13.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.13.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.13.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.13.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.13.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.13.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.13.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.13.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.13.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.14.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.14.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.14.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.14.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.14.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.14.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.14.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.14.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.14.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.15.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.15.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.15.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.15.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.15.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.15.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.15.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.15.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.15.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.16.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.16.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.16.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.16.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.16.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.16.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.16.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.16.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.16.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.17.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.17.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.17.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.17.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.17.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.17.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.17.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.17.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.17.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.18.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.18.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.18.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.18.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.18.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.18.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.18.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.18.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.18.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.19.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.19.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.19.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.19.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.19.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.19.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.19.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.19.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.19.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.2.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.2.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.2.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.2.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.2.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.2.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.2.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.2.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.2.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.20.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.20.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.20.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.20.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.20.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.20.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.20.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.20.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.20.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.21.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.21.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.21.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.21.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.21.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.21.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.21.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.21.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.21.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.22.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.22.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.22.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.22.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.22.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.22.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.22.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.22.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.22.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.23.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.23.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.23.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.23.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.23.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.23.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.23.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.23.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.23.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.24.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.24.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.24.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.24.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.24.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.24.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.24.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.24.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.24.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.25.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.25.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.25.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.25.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.25.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.25.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.25.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.25.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.25.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.26.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.26.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.26.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.26.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.26.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.26.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.26.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.26.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.26.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.27.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.27.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.27.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.27.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.27.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.27.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.27.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.27.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.27.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.28.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.28.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.28.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.28.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.28.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.28.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.28.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.28.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.28.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.29.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.29.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.29.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.29.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.29.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.29.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.29.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.29.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.29.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.3.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.3.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.3.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.3.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.3.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.3.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.3.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.3.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.3.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.30.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.30.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.30.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.30.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.30.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.30.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.30.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.30.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.30.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.31.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.31.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.31.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.31.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.31.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.31.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.31.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.31.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.31.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.32.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.32.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.32.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.32.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.32.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.32.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.32.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.32.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.32.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.33.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.33.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.33.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.33.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.33.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.33.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.33.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.33.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.33.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.34.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.34.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.34.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.34.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.34.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.34.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.34.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.34.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.34.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.35.attention.wk.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.35.attention.wo.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.35.attention.wq.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.35.attention.wv.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.35.attention_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.35.feed_forward.w1.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.35.feed_forward.w2.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.35.feed_forward.w3.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.35.ffn_norm.weight": "consolidated-00271-of-00272.safetensors", + "vision_encoder.transformer.layers.36.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.36.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.36.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.36.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.36.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.36.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.36.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.36.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.36.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.37.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.37.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.37.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.37.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.37.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.37.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.37.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.37.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.37.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.38.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.38.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.38.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.38.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.38.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.38.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.38.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.38.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.38.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.39.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.39.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.39.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.39.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.39.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.39.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.39.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.39.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.39.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.4.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.4.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.4.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.4.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.4.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.4.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.4.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.4.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.4.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.40.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.40.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.40.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.40.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.40.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.40.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.40.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.40.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.40.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.41.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.41.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.41.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.41.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.41.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.41.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.41.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.41.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.41.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.42.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.42.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.42.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.42.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.42.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.42.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.42.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.42.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.42.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.43.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.43.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.43.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.43.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.43.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.43.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.43.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.43.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.43.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.44.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.44.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.44.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.44.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.44.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.44.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.44.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.44.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.44.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.45.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.45.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.45.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.45.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.45.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.45.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.45.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.45.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.45.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.46.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.46.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.46.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.46.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.46.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.46.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.46.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.46.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.46.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.47.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.47.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.47.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.47.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.47.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.47.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.47.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.47.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.47.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.5.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.5.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.5.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.5.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.5.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.5.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.5.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.5.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.5.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.6.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.6.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.6.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.6.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.6.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.6.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.6.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.6.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.6.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.7.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.7.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.7.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.7.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.7.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.7.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.7.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.7.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.7.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.8.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.8.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.8.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.8.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.8.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.8.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.8.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.8.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.8.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.9.attention.wk.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.9.attention.wo.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.9.attention.wq.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.9.attention.wv.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.9.attention_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.9.feed_forward.w1.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.9.feed_forward.w2.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.9.feed_forward.w3.weight": "consolidated-00272-of-00272.safetensors", + "vision_encoder.transformer.layers.9.ffn_norm.weight": "consolidated-00272-of-00272.safetensors", + "vision_language_adapter.w_in.weight": "consolidated-00272-of-00272.safetensors", + "vision_language_adapter.w_out.weight": "consolidated-00272-of-00272.safetensors", + "norm.weight": "consolidated-00272-of-00272.safetensors", + "output.weight": "consolidated-00272-of-00272.safetensors" + } +} \ No newline at end of file