diff --git a/config.json b/config.json index a8125c63232c99c34f5e10c329416c0f64e1eaa2..983c3035a7770d3579e8d151de499f034d1e2c83 100644 --- a/config.json +++ b/config.json @@ -1,5 +1,5 @@ { - "_name_or_path": "/oe-adapt-default/costah/models/405B_finetune_successful", + "_name_or_path": "/weka/oe-adapt-default/hamishi/405b_dpo_v4", "architectures": [ "LlamaForCausalLM" ], @@ -7,6 +7,7 @@ "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": 128001, + "head_dim": 128, "hidden_act": "silu", "hidden_size": 16384, "initializer_range": 0.02, @@ -29,7 +30,7 @@ "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", - "transformers_version": "4.43.4", - "use_cache": true, + "transformers_version": "4.47.1", + "use_cache": false, "vocab_size": 128264 } diff --git a/generation_config.json b/generation_config.json index ddc5a98cd7d8546c217c4812f4fd17279770012e..41de1af1b10386ca8193ae61bdb014263a2402e1 100644 --- a/generation_config.json +++ b/generation_config.json @@ -5,5 +5,5 @@ "eos_token_id": 128001, "temperature": 0.6, "top_p": 0.9, - "transformers_version": "4.43.4" + "transformers_version": "4.47.1" } diff --git a/model-00001-of-00191.safetensors b/model-00001-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e28dc4b54e060bc01f6e58a4dba3d352289da38b --- /dev/null +++ b/model-00001-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0a5c2153dbd137f4878a65a5cfba55dafea83c2266f2388e379232829cd79c7 +size 4806935024 diff --git a/model-00002-of-00191.safetensors b/model-00002-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4320bbb702b1ffb5cde4f1161eb5e91f1f07aa48 --- /dev/null +++ b/model-00002-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e77fe052a1111505a8d5ad3e99505c3a34e11d7bbf85f04a36d0f300680a6ba +size 4026532224 diff --git a/model-00004-of-00191.safetensors b/model-00004-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..35a75932b547cc74e8ee701d834c56d4b1edb480 --- /dev/null +++ b/model-00004-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:551cf09848addf0279b0350e6c256ce0d9f0516e76b539a00696fa9489ed189b +size 4630578112 diff --git a/model-00005-of-00191.safetensors b/model-00005-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6dedb9192587541055412021034e7b745b271c18 --- /dev/null +++ b/model-00005-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84e0aefd62653de5a9d37cada40854ff0fff12ba76662b8f11dd451e89cb40d2 +size 3489661192 diff --git a/model-00007-of-00191.safetensors b/model-00007-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9f003968ca9f7a17ebc5f4c0465f873abe8686dc --- /dev/null +++ b/model-00007-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a39747cb7c2b0ff96140bd2aa5072f82bb2c79c416cbb096354fecb3ad0885b0 +size 4630578112 diff --git a/model-00008-of-00191.safetensors b/model-00008-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c0163a321a35ae24d9caab26d46454bd1afee474 --- /dev/null +++ b/model-00008-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f15b5972f19515effc0ab0f060e7fc05b901e41b9a921f589cf29e6d82d8e93d +size 3489661192 diff --git a/model-00009-of-00191.safetensors b/model-00009-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4ccb93163078cf545224f9a89c6c3f96dbf649bf --- /dev/null +++ b/model-00009-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6412ffe08058fbb7963d2bc3c6ebcc9fe07b2f0935eefbab889d33ae870a2358 +size 4630578112 diff --git a/model-00013-of-00191.safetensors b/model-00013-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9c5c182c65564dae99c796863d66a60f6b4a011b --- /dev/null +++ b/model-00013-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:602fb71a96e108b1f28f7d0b67162ea438ebb0dce7365d1d1434df998f5f9986 +size 4630578112 diff --git a/model-00014-of-00191.safetensors b/model-00014-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..65e01a741ff34b022e1593e4923d25901fe0c6ca --- /dev/null +++ b/model-00014-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a838b9f4f9f5724c91d163e574d5190c6fe7eb44568eca842e510c4e64f366a +size 3489661192 diff --git a/model-00015-of-00191.safetensors b/model-00015-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..18e30211824a804a09c3ded02b32078cec4f4395 --- /dev/null +++ b/model-00015-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc3a6eb6c3b87bb40c6883e58c6de9f2e67b824d1e31758ac63b7e87a979b4c +size 4630578112 diff --git a/model-00016-of-00191.safetensors b/model-00016-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..182ad622e53cbfc48e871a9a179867ff55edb9ac --- /dev/null +++ b/model-00016-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e50e4d6fb73453e4fdce4a2a1bc1c8f7bb44b2a6283fa744c7f734e5fce51a22 +size 4630578120 diff --git a/model-00017-of-00191.safetensors b/model-00017-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..51456caf865d6fb9253720bbb7d50ed1f9d7f229 --- /dev/null +++ b/model-00017-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:234127f7830d59bace8a4e2e8fc5f276486df68397ffae178e8da65f8691f82e +size 3489661192 diff --git a/model-00019-of-00191.safetensors b/model-00019-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7bb3c9183b94c54096bc8e5b58d7f7abe2370ead --- /dev/null +++ b/model-00019-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71682cca2e0d7659475e5631af48ee48b4f472aa06c4128b1eb81f4ac09ba818 +size 4630578120 diff --git a/model-00020-of-00191.safetensors b/model-00020-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b12616adf5bc39dfa7a500fe60beb15be38db783 --- /dev/null +++ b/model-00020-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd4d7017571ec2c14b945cff22733775876ce053e354fb579b63f2d91db1af66 +size 3489661192 diff --git a/model-00021-of-00191.safetensors b/model-00021-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53f5f3b5030d8b85e95064212b65832e551f2c8a --- /dev/null +++ b/model-00021-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e958b43e6e61ec6ae8eec43103484dbcbfe5c57f93c0548af4e59abaa5b1bef +size 4630578120 diff --git a/model-00022-of-00191.safetensors b/model-00022-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..de6de82a61796ad8c98fc78219b12ce51a95bf4d --- /dev/null +++ b/model-00022-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37af015863a1aee00b9cf1ef804c262a1c7fff03f55ea078dccbf2f908fc9346 +size 4630578120 diff --git a/model-00023-of-00191.safetensors b/model-00023-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eb7637bfbace640d373ae832376b7e147d36105e --- /dev/null +++ b/model-00023-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8202ee4b7845428c1ed59346a0f31bf101067e948ebba924849ccd436568780b +size 3489661192 diff --git a/model-00024-of-00191.safetensors b/model-00024-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..132897cae0d5c9f966ad30e4996054d72a6e72fb --- /dev/null +++ b/model-00024-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3181372256f027bde4350f284af42887e4f43047c8bbcd154b42cc00f75eafde +size 4630578120 diff --git a/model-00025-of-00191.safetensors b/model-00025-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc6643aa68919542b82b42d7978d3f14f7467e50 --- /dev/null +++ b/model-00025-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:157429100e321ff9a70d1a381ce42f927a3db79a60ba5a6693b134160259886f +size 4630578120 diff --git a/model-00026-of-00191.safetensors b/model-00026-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4fae08268d71ebaee550163353c0956daa7f2120 --- /dev/null +++ b/model-00026-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:293a211527d4a303e5136b86ea1d52d70eedd1ffd4c4dccb9381dfc6bb99871c +size 3489661192 diff --git a/model-00027-of-00191.safetensors b/model-00027-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d30d20d9d444ae20f9ee60516d2f684cb75a16d8 --- /dev/null +++ b/model-00027-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef9a65b772c83ba0209c9ba5821277c6b7347e91466404a6e43020b12fabbf54 +size 4630578120 diff --git a/model-00028-of-00191.safetensors b/model-00028-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7247aa21a071a1201b6c5631bcc721c160b553be --- /dev/null +++ b/model-00028-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c1b86db7492bc5dd14379575acfbb7eea24feaa566a27a32dd1f1c7dbdc248a +size 4630578120 diff --git a/model-00029-of-00191.safetensors b/model-00029-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5f6e49e35cbd64878c264bebec6653c9cdbe49c2 --- /dev/null +++ b/model-00029-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75933d94dbacc026a2d54f00c5f4cfabf9c2388f77f96c270389a8b9b8df6d78 +size 3489661192 diff --git a/model-00030-of-00191.safetensors b/model-00030-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c3f86de685334d0050f82d6e39acc3bcb685be3 --- /dev/null +++ b/model-00030-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c854123f6bb1355108e0bc3510375db0518c9fafd847c5603e42c6f22298bafc +size 4630578120 diff --git a/model-00031-of-00191.safetensors b/model-00031-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..908b1355aded1e5edc5bb5d243eb58fad756898f --- /dev/null +++ b/model-00031-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ab8acbcaf9ec8a9fa99bb6e50c69f675f7cac5d0af4995a937ed8dbab4dd183 +size 4630578120 diff --git a/model-00032-of-00191.safetensors b/model-00032-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..06513c43588ce05ade6dc0b6cb04ff089f3663db --- /dev/null +++ b/model-00032-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa4a8cf325dce210c8ea523d819781a776a139c4ce4d9489c6ac90851ddad569 +size 3489661192 diff --git a/model-00033-of-00191.safetensors b/model-00033-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..583eba74a6b8e8390fbb2ed9c382af9873971ef4 --- /dev/null +++ b/model-00033-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1bea53f2db158f69ccc2997f6101dc7a9d458b91b76c13c50b5765c74943153 +size 4630578120 diff --git a/model-00034-of-00191.safetensors b/model-00034-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f44c3e5a838e550b35781cc2129a0aed7c04c301 --- /dev/null +++ b/model-00034-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36eb0b10d9e0a5bb36fbe8a1681687d905c2165e4a81cd2fb14dfbf3ead9dcac +size 4630578120 diff --git a/model-00035-of-00191.safetensors b/model-00035-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f6160f1c3c42cdf55e5c307657a346a11061899a --- /dev/null +++ b/model-00035-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aee0c42c487492f696dc3c9fe0ec87b508b0b680d19c6e2dfe9a2560b756e22 +size 3489661192 diff --git a/model-00036-of-00191.safetensors b/model-00036-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fe2cd025def437c02a6e12702000cbfac099ef7a --- /dev/null +++ b/model-00036-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a659b66fe9da3c807b588975231113e6a33dee5c6edd205bfa17c2d654606f5 +size 4630578120 diff --git a/model-00037-of-00191.safetensors b/model-00037-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..56b76c46e95a296af2c5d3e5756912b3544791ec --- /dev/null +++ b/model-00037-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ef26b2c0614ad0d6a615209dce12980a18380c4924d4b429998a12d540438cc +size 4630578120 diff --git a/model-00039-of-00191.safetensors b/model-00039-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aba09e8cefe831065ac6b3a71d43418e9437c764 --- /dev/null +++ b/model-00039-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6587762b654e498ef6f7c0cfe0d0bf32212aad017eba94923343e7c13feeaeb4 +size 4630578120 diff --git a/model-00040-of-00191.safetensors b/model-00040-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3111858ae6ac39e6104e59694abad58be93b6781 --- /dev/null +++ b/model-00040-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b5fc8f2372d80be0315c4aebb0436d06f2255ec196f5e83b8ffe57b5ad58da8 +size 4630578120 diff --git a/model-00041-of-00191.safetensors b/model-00041-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8c83750de53236a416daa3272616be06ccce12f --- /dev/null +++ b/model-00041-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03330ddba4a9591e33317c4c21c0766d4f3be3f118f9c48a2398a2206cfc6213 +size 3489661192 diff --git a/model-00042-of-00191.safetensors b/model-00042-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f680754b3271813643e22f4f78bc6e34d2e35c7a --- /dev/null +++ b/model-00042-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d9d796998425f539c3cc798fd3634e3d86ed34c80c8f1c9a38a3b34dfc630d +size 4630578120 diff --git a/model-00043-of-00191.safetensors b/model-00043-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..57a15e6c1beeb26ae3a52b17ab9d760c69a00f7c --- /dev/null +++ b/model-00043-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61359b81019551b81d8d57f95e4a8b949dedc8749d10105cce3aa0df6e49bc4 +size 4630578120 diff --git a/model-00044-of-00191.safetensors b/model-00044-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..89122e8962b7dec34502051a280bc4100bc7aedc --- /dev/null +++ b/model-00044-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e91720521b2ad86c3c8915dd568b6dbed3a7db99d7993ee84205e0fa8b08729 +size 3489661192 diff --git a/model-00045-of-00191.safetensors b/model-00045-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..37ac9851ca2e439493719abdc98fce0e77eb202f --- /dev/null +++ b/model-00045-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c6ee8e5887a8ce02494e2406d890b3b12a1f00af64adba87988384df2f6400 +size 4630578120 diff --git a/model-00046-of-00191.safetensors b/model-00046-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..19ad99534c90d18e53de39d3cc73112e2626f2a5 --- /dev/null +++ b/model-00046-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7fa5875c1c281648845f7e8861e411cd739603140f8da68f53a5c0c43fb84c +size 4630578120 diff --git a/model-00047-of-00191.safetensors b/model-00047-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..35c23374dc1c93bc0249bbe5d45e7e0b9f6c7c9a --- /dev/null +++ b/model-00047-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f65b4646e145739d9045768b1a050370b663e6165562fb7be46945377397894c +size 3489661192 diff --git a/model-00048-of-00191.safetensors b/model-00048-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7b3805fe663da9107c65a01e929a04935053b7d9 --- /dev/null +++ b/model-00048-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21d41b14c082bf2b55c1ce700c1618a6dad38f2ae0224dce19e1d288c137157f +size 4630578120 diff --git a/model-00049-of-00191.safetensors b/model-00049-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bad7527d0d20da5a96711556d8b55fa08e00e643 --- /dev/null +++ b/model-00049-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e31f48bcc72c250c6d9977bcc2afba7e8e424551eeaac73211efb54394ad83b +size 4630578120 diff --git a/model-00051-of-00191.safetensors b/model-00051-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f2d3a4c359c218751888aa6346d3cf50b113184d --- /dev/null +++ b/model-00051-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c11a6918aeec20eee76d5646981efb4cf31f03720209a3dcd68f51d55999517a +size 4630578120 diff --git a/model-00052-of-00191.safetensors b/model-00052-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e00d3bfadfc5f62688529d2f1e44113881d9bd6c --- /dev/null +++ b/model-00052-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23e7a860438f1b6bb927a4eba058df02e910122d00ecc80f14d3f4c61686f30e +size 4630578120 diff --git a/model-00056-of-00191.safetensors b/model-00056-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0d2658645eab9b11d90cc5f71c4d8ee2cbbb1c29 --- /dev/null +++ b/model-00056-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe483c26806379909d2ffce560a79a60782d890f410c129c94f888ab34fc575 +size 3489661192 diff --git a/model-00057-of-00191.safetensors b/model-00057-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..098fd1b1ad4ac42504b7bb0449ee770ea92e397e --- /dev/null +++ b/model-00057-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10866f5f11b03cb5c3c98e776c25c8ceb6596b77c24cdcc207fff88cb66c535 +size 4630578120 diff --git a/model-00059-of-00191.safetensors b/model-00059-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..98bc97ccbcf034dbed248a3a4b4361b60ad25318 --- /dev/null +++ b/model-00059-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03e06a9952279a0a12e7c955b4b8320b7e16f6567db4a14aa9feb786ff2b9882 +size 3489661192 diff --git a/model-00060-of-00191.safetensors b/model-00060-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..021976b77219ef493295feabf86d43a57bc11c73 --- /dev/null +++ b/model-00060-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47094a83933750a0fe7ac6d9041a74255ac5934255ae1303800bb9b312d0d49 +size 4630578120 diff --git a/model-00061-of-00191.safetensors b/model-00061-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e36bffd9f4a20844be127ed6cb898456a21caaf --- /dev/null +++ b/model-00061-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26f5766ab69dfb03495300ec3176155a5994d20373d256f6310fc82de3282efe +size 4630578120 diff --git a/model-00062-of-00191.safetensors b/model-00062-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4c4a2b2de4890a8d91c91cc53196f02e51020ba0 --- /dev/null +++ b/model-00062-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16c71a8a64dc0eddab67d6b2247f8ad7df729806541a14a2268f8529023a2b8a +size 3489661192 diff --git a/model-00063-of-00191.safetensors b/model-00063-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..40829cd6ff55c608e4c9b77948bbb37070dec150 --- /dev/null +++ b/model-00063-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a97f0b95190ccce6065d43779ff859c56aedbe73d0b596de69fe57937e8027 +size 4630578120 diff --git a/model-00064-of-00191.safetensors b/model-00064-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e772392f0f8e2b3b7f7f26b3184e55079c8a34b7 --- /dev/null +++ b/model-00064-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26cdf540f3b60b8d29fa48c6deee3be161cfbf3fe89568e8d4dd815a25ac5c2 +size 4630578120 diff --git a/model-00065-of-00191.safetensors b/model-00065-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e123be46c02d9d036ef5a9b92e202436b7ba5346 --- /dev/null +++ b/model-00065-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf133fef12c9393b15153ba5e951d3c6a9f250314415a7d5eff7891e4631231 +size 3489661192 diff --git a/model-00067-of-00191.safetensors b/model-00067-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e9d8c9a678cc344ee804636729621738d71b2350 --- /dev/null +++ b/model-00067-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0d1db47bf631f288934cef5dec8b3d30f30cd1477fe79adb78fa17f22c2eabf +size 4630578120 diff --git a/model-00068-of-00191.safetensors b/model-00068-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6dd33c343ac904629ae84f26e987703052ed4fdd --- /dev/null +++ b/model-00068-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5afc31862605e93c8ddac2ff983a970edbeb72455bb49ade0542479255208c1 +size 3489661192 diff --git a/model-00069-of-00191.safetensors b/model-00069-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f20ae73dd69839f1e8d4d53650e7114664a71ac7 --- /dev/null +++ b/model-00069-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c05b771ec3483f9e29fac5d299d09871547d1bf6b33caeff50b5e0aa2073f05d +size 4630578120 diff --git a/model-00070-of-00191.safetensors b/model-00070-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bce88f976e92d8a0a2197e2d2654eb56e001791c --- /dev/null +++ b/model-00070-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dc22af78c7a11fbc4c1733475106fb31f63ac766b80d274ad9970389950d990 +size 4630578120 diff --git a/model-00071-of-00191.safetensors b/model-00071-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e2f7d51cd771ff931f4cc19e738db92b18f7624c --- /dev/null +++ b/model-00071-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebb585798c6b147a0e531e834feeed1cbf66a28ccc209d4a805953159a71dee5 +size 3489661192 diff --git a/model-00072-of-00191.safetensors b/model-00072-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bbac90f3b2703d3cdac231f90698149b31f39ce3 --- /dev/null +++ b/model-00072-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8457210191cd9ca28353eeba81bdcc3b28be203c846bc3d25cdc64452cf3980d +size 4630578120 diff --git a/model-00075-of-00191.safetensors b/model-00075-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aae362e26f50c3db0e520e28bc789b826ba5f306 --- /dev/null +++ b/model-00075-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbefcc2154db9e9d058a6c988f53493050fa50787037acc6f60d08cadbed62fc +size 4630578120 diff --git a/model-00076-of-00191.safetensors b/model-00076-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..750391cd7b02f0c9e520f615efb3c4dae4127d01 --- /dev/null +++ b/model-00076-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9d0e67727406685951e17044409d66b82931f754ae107d04253232394861a14 +size 4630578120 diff --git a/model-00077-of-00191.safetensors b/model-00077-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..62e03630671226bb5a7d369c4c9a6e696615e424 --- /dev/null +++ b/model-00077-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4318f1173c539ae643198bc61560371c75d94aecf04a4729dbf645ea122ad3 +size 3489661192 diff --git a/model-00078-of-00191.safetensors b/model-00078-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9ce8dc371a3956ef3acaf128e5e3c282ca4a5086 --- /dev/null +++ b/model-00078-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c77199b9cfbd416db16440348a9abb999bf3679ecb6824935cbee155a5cc74c5 +size 4630578120 diff --git a/model-00079-of-00191.safetensors b/model-00079-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c2eb47bd6e4417cd1306f0200c7b8e50dce398d8 --- /dev/null +++ b/model-00079-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1472f8f186b6828a6f9df5129036c06e239354a198af0ce4efe2b58020fba94 +size 4630578120 diff --git a/model-00080-of-00191.safetensors b/model-00080-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ac44be935d2c29df3860551209c895cd569d7075 --- /dev/null +++ b/model-00080-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68760cae95525dc587f2eec1bb1bc48ae41d9279bc958a9ed6d35bc2011542e6 +size 3489661192 diff --git a/model-00081-of-00191.safetensors b/model-00081-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ef685a25a2886b85de8593838709c5787ba12066 --- /dev/null +++ b/model-00081-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c78197a53e4105b060121181a363536a7bf16c0cf3de98eb3217e486947a1fb +size 4630578120 diff --git a/model-00082-of-00191.safetensors b/model-00082-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c453a9d0b779d5cf2b24b65a90f98863d11ccf0b --- /dev/null +++ b/model-00082-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac54686eea83432bb925705c29ef2f8ae989bc7a1f5bcaa0d2f44e06da9da03f +size 4630578120 diff --git a/model-00084-of-00191.safetensors b/model-00084-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5b284946d3e7264a57e7ab16cf0c9eada44e5981 --- /dev/null +++ b/model-00084-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9acb52c1f1c8430d20c8df0a93ea99984a9d4908eb1dfe2f93c3a9fd70731f16 +size 4630578120 diff --git a/model-00086-of-00191.safetensors b/model-00086-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0e971b4e135a668c7e49eb456b5ca79868d9afbe --- /dev/null +++ b/model-00086-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8092eb5a30eb2141212f0441d5e8af168e1375ca9eb237c53a45bef65222a1a +size 3489661192 diff --git a/model-00087-of-00191.safetensors b/model-00087-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fb72c52d3cfbd90b5b3dd545ab747d16c65c1a2f --- /dev/null +++ b/model-00087-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0098730dbaa25d2f1a284fafb534ed218cd1bc9f909ced9b1a4e9def13d0787f +size 4630578120 diff --git a/model-00091-of-00191.safetensors b/model-00091-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db56cbb9376d7f1d48598dbfad153d724364f0dd --- /dev/null +++ b/model-00091-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f28507bd56a2d8d874d3574dd87b2d09a0f1a2e89fc2ea926c582778535ba7e +size 4630578120 diff --git a/model-00093-of-00191.safetensors b/model-00093-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a3c52a8e3a7b2447327401d491f38884c569d702 --- /dev/null +++ b/model-00093-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:750e4eaf10cfb4b7a53a6ee1ec3087aa6fee1b52640d59344b7724184c1d66d3 +size 4630578120 diff --git a/model-00094-of-00191.safetensors b/model-00094-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1608253c8ee6e560f001a0cab06b71ec43b9236c --- /dev/null +++ b/model-00094-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe76d92433135f661f80d12d3d2a0a904ba5d52f4d1a2761f45f40f72abc098f +size 4630578120 diff --git a/model-00095-of-00191.safetensors b/model-00095-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ed82db39d347f6304778c08ff51f814c70d919af --- /dev/null +++ b/model-00095-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29edeba92bdfc258885f4d7e66cc51073c68b93639f7a970ca0ec94cc9ad2981 +size 3489661192 diff --git a/model-00096-of-00191.safetensors b/model-00096-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94003f8479444283dd19a7465cb561389b6e2c9c --- /dev/null +++ b/model-00096-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f77646d6c62085b3c3b1827969626833da558ac800e1dcbb982eaff37241543 +size 4630578120 diff --git a/model-00098-of-00191.safetensors b/model-00098-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..69b709116f734ceb1ce49c267da7a9a78f3de401 --- /dev/null +++ b/model-00098-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:452d0a81a161646c972ad4ef47fa0910178ccfe45ee0eb43a4d60d26494e685d +size 3489661192 diff --git a/model-00099-of-00191.safetensors b/model-00099-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1af13eb4a26e43176ba945fe16c3093bdfbda14 --- /dev/null +++ b/model-00099-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6258b575e2af11ff5c24b7a0711899b740ed5cd0b61f63dfdc0dd833e845e32 +size 4630578120 diff --git a/model-00100-of-00191.safetensors b/model-00100-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..553bb79b171a9a9d387fc9bda2be1b35ca9ee75b --- /dev/null +++ b/model-00100-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43f923f8493f51318f91d4a1274cfdef2b77a0062820e8591c4a85be49e22a6 +size 4630578120 diff --git a/model-00101-of-00191.safetensors b/model-00101-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4ffa2570310f01f7934b1706e680d0ba9c208411 --- /dev/null +++ b/model-00101-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37574208ca93dc46cb0edea273b01cc0047dcb5e693f0d1e46b1f113a523eaac +size 3489661192 diff --git a/model-00102-of-00191.safetensors b/model-00102-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..86b4f18d6c697477ac75d2ae306c84aa2873a106 --- /dev/null +++ b/model-00102-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f9f4f6626503b0e15148c1060160a92462ea7204ea73a0425af130f9863551 +size 4630578120 diff --git a/model-00104-of-00191.safetensors b/model-00104-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ce083834ee0bbd6fa2ecc0e0004572c60676ed39 --- /dev/null +++ b/model-00104-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f15ee3c37edeb61354ce25d699a47302708c5cf389aab01c1102f261e6859069 +size 3489661192 diff --git a/model-00106-of-00191.safetensors b/model-00106-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dc41c95bcba9a1fb9323ee12f7390c02d896e950 --- /dev/null +++ b/model-00106-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651db97b3fcd72f7218503406f4717b9ace2781f0c41254460e4b88b0bb4efe5 +size 4630578120 diff --git a/model-00107-of-00191.safetensors b/model-00107-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c013102a8810dde107436f92f43560a330bed526 --- /dev/null +++ b/model-00107-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:773f249ac44b5c382bfadaec92ae6c6b9a3d5228a3db84faeff289f6c8e1a3f7 +size 3489661192 diff --git a/model-00109-of-00191.safetensors b/model-00109-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0310ed85c826810d0ef86bdb99e3b2e07cde6547 --- /dev/null +++ b/model-00109-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5297261c623e613e3c3361c8718a9c8e7b5302a042145793e7ba3f3c24425685 +size 4630578120 diff --git a/model-00110-of-00191.safetensors b/model-00110-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1f4e6f9b304637ed12ed62218c60979216f236fb --- /dev/null +++ b/model-00110-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a1b8314c2f9f6ef79a9d2a5929f2f929abd7b20b95db9d4b5c35d0e86b61cdb +size 3489661192 diff --git a/model-00111-of-00191.safetensors b/model-00111-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..695885feaf0d8f17767cace500b697d275dd04b1 --- /dev/null +++ b/model-00111-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87eb7fe5ae35094094c71a35cc427e37f7f5e6a21c61761fa3e7114b878d18fc +size 4630578120 diff --git a/model-00113-of-00191.safetensors b/model-00113-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..63420cc3eb1b3936efe07fc299c2ec717ffcf86f --- /dev/null +++ b/model-00113-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c204ca7488515a79b04eb1e341a09e22dc8207165a344a199e6b896fac05ca3 +size 3489661192 diff --git a/model-00115-of-00191.safetensors b/model-00115-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..55392dc6af3fe462fc827c123659e4901340e6cf --- /dev/null +++ b/model-00115-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c8bffc7e52affa634fe462fd983e9e1e87ba5d49ef2f19554573ff9c44a17a +size 4630578120 diff --git a/model-00116-of-00191.safetensors b/model-00116-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..94fb3e7d418b4212993e59971f6b12fcdee6ca0a --- /dev/null +++ b/model-00116-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7398040c7314428e7d45aeaac700385d7919ddf3a9e03f2949ebcd22abeaec3 +size 3489661192 diff --git a/model-00117-of-00191.safetensors b/model-00117-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1a378cd553a2f75f61d38297eaf69d4b85d6d067 --- /dev/null +++ b/model-00117-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de8ddf184c8ce99d4abfe8d4c9d4e17c1aa4d64999877e58ea7a8c50ea45a8c6 +size 4630578120 diff --git a/model-00120-of-00191.safetensors b/model-00120-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dec91ba7e6841745a3f049a623b32275849c73d2 --- /dev/null +++ b/model-00120-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2dbe3ba51555536702fc925c1bad896701b9cae9d1bbb0b02dd413b50e7a077 +size 4630578120 diff --git a/model-00122-of-00191.safetensors b/model-00122-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..17e72b2b5596f18a6696c878d0163593378359ef --- /dev/null +++ b/model-00122-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee50812b64dcea24262d975478db40f0effb152355583aacbaa6dd30c775ac4 +size 3489661192 diff --git a/model-00123-of-00191.safetensors b/model-00123-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..54949c199f2ea4e0422d9ce7cee73f14eded6523 --- /dev/null +++ b/model-00123-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e80fb9921075ae69a59eaea7d3f996d556546de8c2caf478c106c7fb95eb22 +size 4630578120 diff --git a/model-00124-of-00191.safetensors b/model-00124-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..11fe72f64fad535e39eb49dde5da1c572f4b5081 --- /dev/null +++ b/model-00124-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769b1e293dd40a7d652737f7a09ad9446c9afbc983fce8fdf497871e442a256c +size 4630578120 diff --git a/model-00125-of-00191.safetensors b/model-00125-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..58ee0616833c95a7b23b9715a8b9d1782ea38756 --- /dev/null +++ b/model-00125-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e31cdef47e4b1a818a350b76683c6f962c05db0c887f67834fe46677137ecb36 +size 3489661192 diff --git a/model-00126-of-00191.safetensors b/model-00126-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c9fc4deda83c273af6cedf437925410d698acfa0 --- /dev/null +++ b/model-00126-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0200e7f72beef6ec5f140765c9fb5fd9053463c7b6bd0a387654afc0141c74 +size 4630578120 diff --git a/model-00127-of-00191.safetensors b/model-00127-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c568a6d628f2515b734d5a241041234662572ba --- /dev/null +++ b/model-00127-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06791ed74a06dce75f8252718602cdfd52d4863d58d078ea47d71dde1aaebf26 +size 4630578120 diff --git a/model-00129-of-00191.safetensors b/model-00129-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..934aae092e8e7b7aa698d47de219f9c3a1dc9804 --- /dev/null +++ b/model-00129-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afe8b41106fa29766d3317693367cb498102e545176ca88497364554bf8651ae +size 4630578120 diff --git a/model-00130-of-00191.safetensors b/model-00130-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3eef65663285fac3656394fab6a72357255dc46c --- /dev/null +++ b/model-00130-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea0406b473d04eb79174f96e0a38f1fd28f834699facd108089be8f159413fd +size 4630578120 diff --git a/model-00134-of-00191.safetensors b/model-00134-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5e9b469b6c2d831ca2d34df3deb5610d13c29dc8 --- /dev/null +++ b/model-00134-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eb9fe12a3487fd7248a20473dfbc731ded3b9f83f24fa25311ea34c8171d546 +size 3489661192 diff --git a/model-00135-of-00191.safetensors b/model-00135-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..eb16a4f1eabb48e4371a2514f033198bccf108cb --- /dev/null +++ b/model-00135-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95e023d1c7139423b8b784380bc3e122b4a59e319400f4155b19326335eb5585 +size 4630578120 diff --git a/model-00137-of-00191.safetensors b/model-00137-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..603fb3afa9c8abcc27ff756ffe14df59fb035214 --- /dev/null +++ b/model-00137-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c5b6d3fe2af1784e6e79cc040ff6913c382b74bca9a41a8e4c9ea3d77536f8 +size 3489661192 diff --git a/model-00138-of-00191.safetensors b/model-00138-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0b8a14f81e69c421e69a4ed467de7d8830ce1154 --- /dev/null +++ b/model-00138-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff5e18017599d9b41fbe7c845fbbb55e125e162fc8285c95a43c507ae808c6d2 +size 4630578120 diff --git a/model-00139-of-00191.safetensors b/model-00139-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..113f50dbbb6cac91e26e91747a9445a49e1c134e --- /dev/null +++ b/model-00139-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890a35aab86601e0c3897babdfcad9b1c0a7daa3094b2eb4c79c7289ccefdc3b +size 4630578120 diff --git a/model-00140-of-00191.safetensors b/model-00140-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7439d299531bb6feda567a66149c49b460a59154 --- /dev/null +++ b/model-00140-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b846c591775db557dfeecf42e5232fe841a9a66baafab60eb65f47e119737639 +size 3489661192 diff --git a/model-00141-of-00191.safetensors b/model-00141-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..31d17a3f192ad1e30ac874f5864fd144beec1292 --- /dev/null +++ b/model-00141-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef71638350b48e5431d2aa366bf439fda887697d42968572c487b869eb16198 +size 4630578120 diff --git a/model-00142-of-00191.safetensors b/model-00142-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..88f34714577586860ef2a1ff0df273a378a2dea1 --- /dev/null +++ b/model-00142-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae497386ca00e677545f4c5325e0a92e761e670aeb2bb02970a64067d93dcdd +size 4630578120 diff --git a/model-00143-of-00191.safetensors b/model-00143-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..db4e8181c524e1b8686cf4e3585489efbfb37d90 --- /dev/null +++ b/model-00143-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de16c7704b922d9c4c755dd44a507f7a403aeac0b8598aa8930fbf2f108fade +size 3489661192 diff --git a/model-00144-of-00191.safetensors b/model-00144-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..693dc56f424506cdafe53dfd28ad9b96d315f101 --- /dev/null +++ b/model-00144-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bda20547da2f6794f841734046ede1ad4fe60b82b456699ead46afc982ddbc28 +size 4630578120 diff --git a/model-00146-of-00191.safetensors b/model-00146-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..286802b6bb0bfafe66aa8057f136d3a5b6db9852 --- /dev/null +++ b/model-00146-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b096b0b04c87062185321dc5d13f9d795f26a9520e3219ea9f31ae8f34c48a +size 3489661192 diff --git a/model-00147-of-00191.safetensors b/model-00147-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee2f1e588ece26d584a26ab0911e481218df2dd8 --- /dev/null +++ b/model-00147-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8ec6ce84bc11b198f009418574bae32d78d5ce5f9b885a1aaf14b914fe1286 +size 4630578120 diff --git a/model-00148-of-00191.safetensors b/model-00148-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b3370486cd403b551e2161a912a21e738aad5a85 --- /dev/null +++ b/model-00148-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2296674a9686acc7d6c4f32ae2ccdbb7e3e83ff0b0d08ef4ca26458881570e55 +size 4630578120 diff --git a/model-00151-of-00191.safetensors b/model-00151-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5b022c8a440fb9e6f4098aa6d004c28068cf2bdd --- /dev/null +++ b/model-00151-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:944ee7bfe4fc787177892a28c2792eb0cc5e2fc60747601654b087c9fa4ae041 +size 4630578128 diff --git a/model-00153-of-00191.safetensors b/model-00153-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d8b464219852f3f1f6d81424ee6d4f9ee9555546 --- /dev/null +++ b/model-00153-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c57169c7709a18c0101c01727dbd78b27e3f3b3d3598667d1a10e3f3653bcb +size 4630578128 diff --git a/model-00154-of-00191.safetensors b/model-00154-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3268998e5f4dd9b77649f54c57ea8804fb544e0c --- /dev/null +++ b/model-00154-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62e101871d814a9039b4a6d0678434a83c6c2db96c099d2f9509a77d25982f67 +size 4630578128 diff --git a/model-00156-of-00191.safetensors b/model-00156-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fa17b0b86c706f952e845d40ed1febde96e3d0ff --- /dev/null +++ b/model-00156-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcea6dbdb520fd74559a1dd18eea73301c6f63cf09b04f9b3cda5bceb4f2cc44 +size 4630578128 diff --git a/model-00157-of-00191.safetensors b/model-00157-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..842f591d932ed81fb33c3261cbbbd7aa332f8966 --- /dev/null +++ b/model-00157-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe472487a598361ed297d3fb9b5684114e85a9e3bd0cbb2bd37af1d9f187c0ab +size 4630578128 diff --git a/model-00158-of-00191.safetensors b/model-00158-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..76f6bedc644a1cffac21fa7ea46015eaf40dff32 --- /dev/null +++ b/model-00158-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b60dff6b29d45fe7fa93e627164699ddffabd776451caff5f8beb8387bfa829a +size 3489661200 diff --git a/model-00159-of-00191.safetensors b/model-00159-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a5f8b3de8a980ba98ef1ce61abd75cc4e79428e5 --- /dev/null +++ b/model-00159-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab6866760e53283fde9f7c9974ff7edd1fbf8d7adb48a61c3625a1a9bafc9d6 +size 4630578128 diff --git a/model-00161-of-00191.safetensors b/model-00161-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4d3a2f1a14d9b94ee9298dfe572bcffe250a9475 --- /dev/null +++ b/model-00161-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7981d47d878ba7f59202687d212ae2140da3af8e09475f105a58ef37447555d +size 3489661200 diff --git a/model-00163-of-00191.safetensors b/model-00163-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f9ebeb4a48a227431d016152c220ae434445a490 --- /dev/null +++ b/model-00163-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3f4aaa537d3f94ccbac67e91b57817e482e9beb5995880c549f49016b7f2ab1 +size 4630578128 diff --git a/model-00165-of-00191.safetensors b/model-00165-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..071a0f2e03abdc4dd64101e62640979bc63591d2 --- /dev/null +++ b/model-00165-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a3e1a920b27016f16060d7ebcf89f6d5ce605fcf4ac47e30222b8036f321eba +size 4630578128 diff --git a/model-00166-of-00191.safetensors b/model-00166-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..05edc4ce0553c201e98a5fd5048d661b030fc62e --- /dev/null +++ b/model-00166-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232723525465ac190b48ae2d764ce0a95d937c92c24ba6b36b4d274ceb79f2b4 +size 4630578128 diff --git a/model-00167-of-00191.safetensors b/model-00167-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e0dfcf206ade0bcb76b903ab1a12410650d1ceae --- /dev/null +++ b/model-00167-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8142b5fcca7c91b3fc26477d47d6a1fca97b401a35e85f78ec2b6035fd90196b +size 3489661200 diff --git a/model-00168-of-00191.safetensors b/model-00168-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ce28cfb6d840f3636ee066b62494b186e91d4c5d --- /dev/null +++ b/model-00168-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82046192828ef187c0171d0ad6255d59646ced0fc698707862990d4aea213d1 +size 4630578128 diff --git a/model-00169-of-00191.safetensors b/model-00169-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3009d38aadb5a8907dde54e2a0ca18e77d1216bc --- /dev/null +++ b/model-00169-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49cdac2ce16026d42b3ff05eeb9f04f19b70950c82f4e563f93f4acb2da16280 +size 4630578128 diff --git a/model-00170-of-00191.safetensors b/model-00170-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..120be3f1f8ea9463ea7b8a374a134b5b6bdcbc7f --- /dev/null +++ b/model-00170-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fb236cc1845ceb7d88111112f65a495f43d3e38965c6df8783ec0cd452d3ad8 +size 3489661200 diff --git a/model-00171-of-00191.safetensors b/model-00171-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0eeb2e8e62872a7091bec0260db27028129daccc --- /dev/null +++ b/model-00171-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02b777633245e7a1d60495669cf57c38124dee4d47655bf6392ca2907083a03 +size 4630578128 diff --git a/model-00172-of-00191.safetensors b/model-00172-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1155efee8f3f39f96f33e91a6cdd6d68a98a01b4 --- /dev/null +++ b/model-00172-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ca32b2d2a20635cb2b0ee3dd95ff89708f04474b95e9d8a5e56c88ba1ea4b4 +size 4630578128 diff --git a/model-00173-of-00191.safetensors b/model-00173-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..da1037bb23d38133ac5f65b9f6c3d9c8dfa29795 --- /dev/null +++ b/model-00173-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7fd81bf01573734f5fde2c7d7a9e4b05c42d1c9fd1cb842e7c1d9e9cb04fa4e +size 3489661200 diff --git a/model-00175-of-00191.safetensors b/model-00175-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f3016860f46151426f7e79d5e6a2ed7846393b92 --- /dev/null +++ b/model-00175-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcacfc97181aaa9c0836b96a8f8f166625a293ffa0321932cfd7f676895c789e +size 4630578128 diff --git a/model-00176-of-00191.safetensors b/model-00176-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..049be0278825eb1dfd94f320b178431887902d87 --- /dev/null +++ b/model-00176-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15abda21d0bc9bbf9f96b6d2951cb91ec905c6b233b47936e8c1ffa1037b268d +size 3489661200 diff --git a/model-00177-of-00191.safetensors b/model-00177-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0103be694cc989d48dcce3cbd2ce350269c97304 --- /dev/null +++ b/model-00177-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b51a999bb4117de1b58112e9cf903fa1d26b5db8a74c50242f9c458c78526b45 +size 4630578128 diff --git a/model-00179-of-00191.safetensors b/model-00179-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f96dc952e620568eb877b3e8bb4f9c3b997a0934 --- /dev/null +++ b/model-00179-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3ac215e1726a17f47805f19636b9f937406bb1ff5d38951f27604f68c0c37fd +size 3489661200 diff --git a/model-00181-of-00191.safetensors b/model-00181-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e5f1552d589de6eac74075dd959ac6cc69a4fcda --- /dev/null +++ b/model-00181-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d99bbc891c2b3e3bcd98e6400d9b1b3cc97520311d614aebd65cc2522297d959 +size 4630578128 diff --git a/model-00182-of-00191.safetensors b/model-00182-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cf2e513c08937fe249a68a19d663a9acfd947213 --- /dev/null +++ b/model-00182-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a04d06faa94b92a3dc3ecace7550b1332835068d55f99d3aa02704397fd563e +size 3489661200 diff --git a/model-00183-of-00191.safetensors b/model-00183-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a016a52d8fb307d85ffcbafa3748e643faaef70a --- /dev/null +++ b/model-00183-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5c57cc7c78f31d62cbb2a33670866f058d499327f6db64a35774c64f1af967 +size 4630578128 diff --git a/model-00184-of-00191.safetensors b/model-00184-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..88cb76ec63e8cf793e49917bdd9878e824fa6765 --- /dev/null +++ b/model-00184-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a60ab147335d48859a1513c8d90843fe3f7dcfed55e9c0c0d07adc675f4dd55d +size 4630578128 diff --git a/model-00185-of-00191.safetensors b/model-00185-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..accb15fa16074bf8781450d4401ce870fd63fc5f --- /dev/null +++ b/model-00185-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31aa2c3e679a460c054ab71282c5c0b4518dbbbcffe76531588bd096338b65db +size 3489661200 diff --git a/model-00186-of-00191.safetensors b/model-00186-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ade4884db6611b8853897ee8d5e17cf43b150eea --- /dev/null +++ b/model-00186-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6555e93beb6f41ae21093f1a8c4a2088f1db09b5f90d54cec9a4d6b982b8d29f +size 4630578128 diff --git a/model-00187-of-00191.safetensors b/model-00187-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..25f6b47eb3d711f35fdf9440253f0e1097ab78f6 --- /dev/null +++ b/model-00187-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:778bca572fa56cd63d9f343bcb5e5607cdb48c1264157fd3a029a5bdc2d52e68 +size 4630578128 diff --git a/model-00188-of-00191.safetensors b/model-00188-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc6b904db90c6a9d6f99c8873f210d0884c10461 --- /dev/null +++ b/model-00188-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3df61957af77f1ad72226e71b6f15bf88e39da086db9fe1406c15ce2fc32ff8f +size 3489661200 diff --git a/model-00189-of-00191.safetensors b/model-00189-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..83191db96a7843d7354f6625bc008acf00c44a8c --- /dev/null +++ b/model-00189-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1d0f574b8732ca26611ad178c42904bf20ded976b0b0817eec3180163141c0 +size 4630578128 diff --git a/model-00190-of-00191.safetensors b/model-00190-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cc9c9f7daed6a013774a9d449df9caaa62d0f708 --- /dev/null +++ b/model-00190-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8f84088c2901d46abc241325517e9b35d412c2b740c807249ab6e4113c6e462 +size 3489759816 diff --git a/model-00191-of-00191.safetensors b/model-00191-of-00191.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..82cf784192e3662f9b355f67e009a7d7ea3a0f4b --- /dev/null +++ b/model-00191-of-00191.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c2e4187e1b1bf25f455a530fd8f2e90f78e79391ce55400a1a6d9629b30522e +size 4202954880 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..8ce8f051c67b9502bac27d6878d78e0f889ef291 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,1144 @@ +{ + "metadata": { + "total_size": 811707301888 + }, + "weight_map": { + "lm_head.weight": "model-00191-of-00191.safetensors", + "model.embed_tokens.weight": "model-00001-of-00191.safetensors", + "model.layers.0.input_layernorm.weight": "model-00003-of-00191.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00003-of-00191.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00002-of-00191.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00002-of-00191.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00003-of-00191.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00191.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00002-of-00191.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00191.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00191.safetensors", + "model.layers.1.input_layernorm.weight": "model-00004-of-00191.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00004-of-00191.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00003-of-00191.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00004-of-00191.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00004-of-00191.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00003-of-00191.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00003-of-00191.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00003-of-00191.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00003-of-00191.safetensors", + "model.layers.10.input_layernorm.weight": "model-00018-of-00191.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00018-of-00191.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00017-of-00191.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00017-of-00191.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00018-of-00191.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00016-of-00191.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00016-of-00191.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00016-of-00191.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00016-of-00191.safetensors", + "model.layers.100.input_layernorm.weight": "model-00153-of-00191.safetensors", + "model.layers.100.mlp.down_proj.weight": "model-00153-of-00191.safetensors", + "model.layers.100.mlp.gate_proj.weight": "model-00152-of-00191.safetensors", + "model.layers.100.mlp.up_proj.weight": "model-00152-of-00191.safetensors", + "model.layers.100.post_attention_layernorm.weight": "model-00153-of-00191.safetensors", + "model.layers.100.self_attn.k_proj.weight": "model-00151-of-00191.safetensors", + "model.layers.100.self_attn.o_proj.weight": "model-00151-of-00191.safetensors", + "model.layers.100.self_attn.q_proj.weight": "model-00151-of-00191.safetensors", + "model.layers.100.self_attn.v_proj.weight": "model-00151-of-00191.safetensors", + "model.layers.101.input_layernorm.weight": "model-00154-of-00191.safetensors", + "model.layers.101.mlp.down_proj.weight": "model-00154-of-00191.safetensors", + "model.layers.101.mlp.gate_proj.weight": "model-00153-of-00191.safetensors", + "model.layers.101.mlp.up_proj.weight": "model-00154-of-00191.safetensors", + "model.layers.101.post_attention_layernorm.weight": "model-00154-of-00191.safetensors", + "model.layers.101.self_attn.k_proj.weight": "model-00153-of-00191.safetensors", + "model.layers.101.self_attn.o_proj.weight": "model-00153-of-00191.safetensors", + "model.layers.101.self_attn.q_proj.weight": "model-00153-of-00191.safetensors", + "model.layers.101.self_attn.v_proj.weight": "model-00153-of-00191.safetensors", + "model.layers.102.input_layernorm.weight": "model-00156-of-00191.safetensors", + "model.layers.102.mlp.down_proj.weight": "model-00156-of-00191.safetensors", + "model.layers.102.mlp.gate_proj.weight": "model-00155-of-00191.safetensors", + "model.layers.102.mlp.up_proj.weight": "model-00155-of-00191.safetensors", + "model.layers.102.post_attention_layernorm.weight": "model-00156-of-00191.safetensors", + "model.layers.102.self_attn.k_proj.weight": "model-00154-of-00191.safetensors", + "model.layers.102.self_attn.o_proj.weight": "model-00154-of-00191.safetensors", + "model.layers.102.self_attn.q_proj.weight": "model-00154-of-00191.safetensors", + "model.layers.102.self_attn.v_proj.weight": "model-00154-of-00191.safetensors", + "model.layers.103.input_layernorm.weight": "model-00157-of-00191.safetensors", + "model.layers.103.mlp.down_proj.weight": "model-00157-of-00191.safetensors", + "model.layers.103.mlp.gate_proj.weight": "model-00156-of-00191.safetensors", + "model.layers.103.mlp.up_proj.weight": "model-00157-of-00191.safetensors", + "model.layers.103.post_attention_layernorm.weight": "model-00157-of-00191.safetensors", + "model.layers.103.self_attn.k_proj.weight": "model-00156-of-00191.safetensors", + "model.layers.103.self_attn.o_proj.weight": "model-00156-of-00191.safetensors", + "model.layers.103.self_attn.q_proj.weight": "model-00156-of-00191.safetensors", + "model.layers.103.self_attn.v_proj.weight": "model-00156-of-00191.safetensors", + "model.layers.104.input_layernorm.weight": "model-00159-of-00191.safetensors", + "model.layers.104.mlp.down_proj.weight": "model-00159-of-00191.safetensors", + "model.layers.104.mlp.gate_proj.weight": "model-00158-of-00191.safetensors", + "model.layers.104.mlp.up_proj.weight": "model-00158-of-00191.safetensors", + "model.layers.104.post_attention_layernorm.weight": "model-00159-of-00191.safetensors", + "model.layers.104.self_attn.k_proj.weight": "model-00157-of-00191.safetensors", + "model.layers.104.self_attn.o_proj.weight": "model-00157-of-00191.safetensors", + "model.layers.104.self_attn.q_proj.weight": "model-00157-of-00191.safetensors", + "model.layers.104.self_attn.v_proj.weight": "model-00157-of-00191.safetensors", + "model.layers.105.input_layernorm.weight": "model-00160-of-00191.safetensors", + "model.layers.105.mlp.down_proj.weight": "model-00160-of-00191.safetensors", + "model.layers.105.mlp.gate_proj.weight": "model-00159-of-00191.safetensors", + "model.layers.105.mlp.up_proj.weight": "model-00160-of-00191.safetensors", + "model.layers.105.post_attention_layernorm.weight": "model-00160-of-00191.safetensors", + "model.layers.105.self_attn.k_proj.weight": "model-00159-of-00191.safetensors", + "model.layers.105.self_attn.o_proj.weight": "model-00159-of-00191.safetensors", + "model.layers.105.self_attn.q_proj.weight": "model-00159-of-00191.safetensors", + "model.layers.105.self_attn.v_proj.weight": "model-00159-of-00191.safetensors", + "model.layers.106.input_layernorm.weight": "model-00162-of-00191.safetensors", + "model.layers.106.mlp.down_proj.weight": "model-00162-of-00191.safetensors", + "model.layers.106.mlp.gate_proj.weight": "model-00161-of-00191.safetensors", + "model.layers.106.mlp.up_proj.weight": "model-00161-of-00191.safetensors", + "model.layers.106.post_attention_layernorm.weight": "model-00162-of-00191.safetensors", + "model.layers.106.self_attn.k_proj.weight": "model-00160-of-00191.safetensors", + "model.layers.106.self_attn.o_proj.weight": "model-00160-of-00191.safetensors", + "model.layers.106.self_attn.q_proj.weight": "model-00160-of-00191.safetensors", + "model.layers.106.self_attn.v_proj.weight": "model-00160-of-00191.safetensors", + "model.layers.107.input_layernorm.weight": "model-00163-of-00191.safetensors", + "model.layers.107.mlp.down_proj.weight": "model-00163-of-00191.safetensors", + "model.layers.107.mlp.gate_proj.weight": "model-00162-of-00191.safetensors", + "model.layers.107.mlp.up_proj.weight": "model-00163-of-00191.safetensors", + "model.layers.107.post_attention_layernorm.weight": "model-00163-of-00191.safetensors", + "model.layers.107.self_attn.k_proj.weight": "model-00162-of-00191.safetensors", + "model.layers.107.self_attn.o_proj.weight": "model-00162-of-00191.safetensors", + "model.layers.107.self_attn.q_proj.weight": "model-00162-of-00191.safetensors", + "model.layers.107.self_attn.v_proj.weight": "model-00162-of-00191.safetensors", + "model.layers.108.input_layernorm.weight": "model-00165-of-00191.safetensors", + "model.layers.108.mlp.down_proj.weight": "model-00165-of-00191.safetensors", + "model.layers.108.mlp.gate_proj.weight": "model-00164-of-00191.safetensors", + "model.layers.108.mlp.up_proj.weight": "model-00164-of-00191.safetensors", + "model.layers.108.post_attention_layernorm.weight": "model-00165-of-00191.safetensors", + "model.layers.108.self_attn.k_proj.weight": "model-00163-of-00191.safetensors", + "model.layers.108.self_attn.o_proj.weight": "model-00163-of-00191.safetensors", + "model.layers.108.self_attn.q_proj.weight": "model-00163-of-00191.safetensors", + "model.layers.108.self_attn.v_proj.weight": "model-00163-of-00191.safetensors", + "model.layers.109.input_layernorm.weight": "model-00166-of-00191.safetensors", + "model.layers.109.mlp.down_proj.weight": "model-00166-of-00191.safetensors", + "model.layers.109.mlp.gate_proj.weight": "model-00165-of-00191.safetensors", + "model.layers.109.mlp.up_proj.weight": "model-00166-of-00191.safetensors", + "model.layers.109.post_attention_layernorm.weight": "model-00166-of-00191.safetensors", + "model.layers.109.self_attn.k_proj.weight": "model-00165-of-00191.safetensors", + "model.layers.109.self_attn.o_proj.weight": "model-00165-of-00191.safetensors", + "model.layers.109.self_attn.q_proj.weight": "model-00165-of-00191.safetensors", + "model.layers.109.self_attn.v_proj.weight": "model-00165-of-00191.safetensors", + "model.layers.11.input_layernorm.weight": "model-00019-of-00191.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00019-of-00191.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00018-of-00191.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00019-of-00191.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00019-of-00191.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00018-of-00191.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00018-of-00191.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00018-of-00191.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00018-of-00191.safetensors", + "model.layers.110.input_layernorm.weight": "model-00168-of-00191.safetensors", + "model.layers.110.mlp.down_proj.weight": "model-00168-of-00191.safetensors", + "model.layers.110.mlp.gate_proj.weight": "model-00167-of-00191.safetensors", + "model.layers.110.mlp.up_proj.weight": "model-00167-of-00191.safetensors", + "model.layers.110.post_attention_layernorm.weight": "model-00168-of-00191.safetensors", + "model.layers.110.self_attn.k_proj.weight": "model-00166-of-00191.safetensors", + "model.layers.110.self_attn.o_proj.weight": "model-00166-of-00191.safetensors", + "model.layers.110.self_attn.q_proj.weight": "model-00166-of-00191.safetensors", + "model.layers.110.self_attn.v_proj.weight": "model-00166-of-00191.safetensors", + "model.layers.111.input_layernorm.weight": "model-00169-of-00191.safetensors", + "model.layers.111.mlp.down_proj.weight": "model-00169-of-00191.safetensors", + "model.layers.111.mlp.gate_proj.weight": "model-00168-of-00191.safetensors", + "model.layers.111.mlp.up_proj.weight": "model-00169-of-00191.safetensors", + "model.layers.111.post_attention_layernorm.weight": "model-00169-of-00191.safetensors", + "model.layers.111.self_attn.k_proj.weight": "model-00168-of-00191.safetensors", + "model.layers.111.self_attn.o_proj.weight": "model-00168-of-00191.safetensors", + "model.layers.111.self_attn.q_proj.weight": "model-00168-of-00191.safetensors", + "model.layers.111.self_attn.v_proj.weight": "model-00168-of-00191.safetensors", + "model.layers.112.input_layernorm.weight": "model-00171-of-00191.safetensors", + "model.layers.112.mlp.down_proj.weight": "model-00171-of-00191.safetensors", + "model.layers.112.mlp.gate_proj.weight": "model-00170-of-00191.safetensors", + "model.layers.112.mlp.up_proj.weight": "model-00170-of-00191.safetensors", + "model.layers.112.post_attention_layernorm.weight": "model-00171-of-00191.safetensors", + "model.layers.112.self_attn.k_proj.weight": "model-00169-of-00191.safetensors", + "model.layers.112.self_attn.o_proj.weight": "model-00169-of-00191.safetensors", + "model.layers.112.self_attn.q_proj.weight": "model-00169-of-00191.safetensors", + "model.layers.112.self_attn.v_proj.weight": "model-00169-of-00191.safetensors", + "model.layers.113.input_layernorm.weight": "model-00172-of-00191.safetensors", + "model.layers.113.mlp.down_proj.weight": "model-00172-of-00191.safetensors", + "model.layers.113.mlp.gate_proj.weight": "model-00171-of-00191.safetensors", + "model.layers.113.mlp.up_proj.weight": "model-00172-of-00191.safetensors", + "model.layers.113.post_attention_layernorm.weight": "model-00172-of-00191.safetensors", + "model.layers.113.self_attn.k_proj.weight": "model-00171-of-00191.safetensors", + "model.layers.113.self_attn.o_proj.weight": "model-00171-of-00191.safetensors", + "model.layers.113.self_attn.q_proj.weight": "model-00171-of-00191.safetensors", + "model.layers.113.self_attn.v_proj.weight": "model-00171-of-00191.safetensors", + "model.layers.114.input_layernorm.weight": "model-00174-of-00191.safetensors", + "model.layers.114.mlp.down_proj.weight": "model-00174-of-00191.safetensors", + "model.layers.114.mlp.gate_proj.weight": "model-00173-of-00191.safetensors", + "model.layers.114.mlp.up_proj.weight": "model-00173-of-00191.safetensors", + "model.layers.114.post_attention_layernorm.weight": "model-00174-of-00191.safetensors", + "model.layers.114.self_attn.k_proj.weight": "model-00172-of-00191.safetensors", + "model.layers.114.self_attn.o_proj.weight": "model-00172-of-00191.safetensors", + "model.layers.114.self_attn.q_proj.weight": "model-00172-of-00191.safetensors", + "model.layers.114.self_attn.v_proj.weight": "model-00172-of-00191.safetensors", + "model.layers.115.input_layernorm.weight": "model-00175-of-00191.safetensors", + "model.layers.115.mlp.down_proj.weight": "model-00175-of-00191.safetensors", + "model.layers.115.mlp.gate_proj.weight": "model-00174-of-00191.safetensors", + "model.layers.115.mlp.up_proj.weight": "model-00175-of-00191.safetensors", + "model.layers.115.post_attention_layernorm.weight": "model-00175-of-00191.safetensors", + "model.layers.115.self_attn.k_proj.weight": "model-00174-of-00191.safetensors", + "model.layers.115.self_attn.o_proj.weight": "model-00174-of-00191.safetensors", + "model.layers.115.self_attn.q_proj.weight": "model-00174-of-00191.safetensors", + "model.layers.115.self_attn.v_proj.weight": "model-00174-of-00191.safetensors", + "model.layers.116.input_layernorm.weight": "model-00177-of-00191.safetensors", + "model.layers.116.mlp.down_proj.weight": "model-00177-of-00191.safetensors", + "model.layers.116.mlp.gate_proj.weight": "model-00176-of-00191.safetensors", + "model.layers.116.mlp.up_proj.weight": "model-00176-of-00191.safetensors", + "model.layers.116.post_attention_layernorm.weight": "model-00177-of-00191.safetensors", + "model.layers.116.self_attn.k_proj.weight": "model-00175-of-00191.safetensors", + "model.layers.116.self_attn.o_proj.weight": "model-00175-of-00191.safetensors", + "model.layers.116.self_attn.q_proj.weight": "model-00175-of-00191.safetensors", + "model.layers.116.self_attn.v_proj.weight": "model-00175-of-00191.safetensors", + "model.layers.117.input_layernorm.weight": "model-00178-of-00191.safetensors", + "model.layers.117.mlp.down_proj.weight": "model-00178-of-00191.safetensors", + "model.layers.117.mlp.gate_proj.weight": "model-00177-of-00191.safetensors", + "model.layers.117.mlp.up_proj.weight": "model-00178-of-00191.safetensors", + "model.layers.117.post_attention_layernorm.weight": "model-00178-of-00191.safetensors", + "model.layers.117.self_attn.k_proj.weight": "model-00177-of-00191.safetensors", + "model.layers.117.self_attn.o_proj.weight": "model-00177-of-00191.safetensors", + "model.layers.117.self_attn.q_proj.weight": "model-00177-of-00191.safetensors", + "model.layers.117.self_attn.v_proj.weight": "model-00177-of-00191.safetensors", + "model.layers.118.input_layernorm.weight": "model-00180-of-00191.safetensors", + "model.layers.118.mlp.down_proj.weight": "model-00180-of-00191.safetensors", + "model.layers.118.mlp.gate_proj.weight": "model-00179-of-00191.safetensors", + "model.layers.118.mlp.up_proj.weight": "model-00179-of-00191.safetensors", + "model.layers.118.post_attention_layernorm.weight": "model-00180-of-00191.safetensors", + "model.layers.118.self_attn.k_proj.weight": "model-00178-of-00191.safetensors", + "model.layers.118.self_attn.o_proj.weight": "model-00178-of-00191.safetensors", + "model.layers.118.self_attn.q_proj.weight": "model-00178-of-00191.safetensors", + "model.layers.118.self_attn.v_proj.weight": "model-00178-of-00191.safetensors", + "model.layers.119.input_layernorm.weight": "model-00181-of-00191.safetensors", + "model.layers.119.mlp.down_proj.weight": "model-00181-of-00191.safetensors", + "model.layers.119.mlp.gate_proj.weight": "model-00180-of-00191.safetensors", + "model.layers.119.mlp.up_proj.weight": "model-00181-of-00191.safetensors", + "model.layers.119.post_attention_layernorm.weight": "model-00181-of-00191.safetensors", + "model.layers.119.self_attn.k_proj.weight": "model-00180-of-00191.safetensors", + "model.layers.119.self_attn.o_proj.weight": "model-00180-of-00191.safetensors", + "model.layers.119.self_attn.q_proj.weight": "model-00180-of-00191.safetensors", + "model.layers.119.self_attn.v_proj.weight": "model-00180-of-00191.safetensors", + "model.layers.12.input_layernorm.weight": "model-00021-of-00191.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00021-of-00191.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00020-of-00191.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00020-of-00191.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00021-of-00191.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00019-of-00191.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00019-of-00191.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00019-of-00191.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00019-of-00191.safetensors", + "model.layers.120.input_layernorm.weight": "model-00183-of-00191.safetensors", + "model.layers.120.mlp.down_proj.weight": "model-00183-of-00191.safetensors", + "model.layers.120.mlp.gate_proj.weight": "model-00182-of-00191.safetensors", + "model.layers.120.mlp.up_proj.weight": "model-00182-of-00191.safetensors", + "model.layers.120.post_attention_layernorm.weight": "model-00183-of-00191.safetensors", + "model.layers.120.self_attn.k_proj.weight": "model-00181-of-00191.safetensors", + "model.layers.120.self_attn.o_proj.weight": "model-00181-of-00191.safetensors", + "model.layers.120.self_attn.q_proj.weight": "model-00181-of-00191.safetensors", + "model.layers.120.self_attn.v_proj.weight": "model-00181-of-00191.safetensors", + "model.layers.121.input_layernorm.weight": "model-00184-of-00191.safetensors", + "model.layers.121.mlp.down_proj.weight": "model-00184-of-00191.safetensors", + "model.layers.121.mlp.gate_proj.weight": "model-00183-of-00191.safetensors", + "model.layers.121.mlp.up_proj.weight": "model-00184-of-00191.safetensors", + "model.layers.121.post_attention_layernorm.weight": "model-00184-of-00191.safetensors", + "model.layers.121.self_attn.k_proj.weight": "model-00183-of-00191.safetensors", + "model.layers.121.self_attn.o_proj.weight": "model-00183-of-00191.safetensors", + "model.layers.121.self_attn.q_proj.weight": "model-00183-of-00191.safetensors", + "model.layers.121.self_attn.v_proj.weight": "model-00183-of-00191.safetensors", + "model.layers.122.input_layernorm.weight": "model-00186-of-00191.safetensors", + "model.layers.122.mlp.down_proj.weight": "model-00186-of-00191.safetensors", + "model.layers.122.mlp.gate_proj.weight": "model-00185-of-00191.safetensors", + "model.layers.122.mlp.up_proj.weight": "model-00185-of-00191.safetensors", + "model.layers.122.post_attention_layernorm.weight": "model-00186-of-00191.safetensors", + "model.layers.122.self_attn.k_proj.weight": "model-00184-of-00191.safetensors", + "model.layers.122.self_attn.o_proj.weight": "model-00184-of-00191.safetensors", + "model.layers.122.self_attn.q_proj.weight": "model-00184-of-00191.safetensors", + "model.layers.122.self_attn.v_proj.weight": "model-00184-of-00191.safetensors", + "model.layers.123.input_layernorm.weight": "model-00187-of-00191.safetensors", + "model.layers.123.mlp.down_proj.weight": "model-00187-of-00191.safetensors", + "model.layers.123.mlp.gate_proj.weight": "model-00186-of-00191.safetensors", + "model.layers.123.mlp.up_proj.weight": "model-00187-of-00191.safetensors", + "model.layers.123.post_attention_layernorm.weight": "model-00187-of-00191.safetensors", + "model.layers.123.self_attn.k_proj.weight": "model-00186-of-00191.safetensors", + "model.layers.123.self_attn.o_proj.weight": "model-00186-of-00191.safetensors", + "model.layers.123.self_attn.q_proj.weight": "model-00186-of-00191.safetensors", + "model.layers.123.self_attn.v_proj.weight": "model-00186-of-00191.safetensors", + "model.layers.124.input_layernorm.weight": "model-00189-of-00191.safetensors", + "model.layers.124.mlp.down_proj.weight": "model-00189-of-00191.safetensors", + "model.layers.124.mlp.gate_proj.weight": "model-00188-of-00191.safetensors", + "model.layers.124.mlp.up_proj.weight": "model-00188-of-00191.safetensors", + "model.layers.124.post_attention_layernorm.weight": "model-00189-of-00191.safetensors", + "model.layers.124.self_attn.k_proj.weight": "model-00187-of-00191.safetensors", + "model.layers.124.self_attn.o_proj.weight": "model-00187-of-00191.safetensors", + "model.layers.124.self_attn.q_proj.weight": "model-00187-of-00191.safetensors", + "model.layers.124.self_attn.v_proj.weight": "model-00187-of-00191.safetensors", + "model.layers.125.input_layernorm.weight": "model-00190-of-00191.safetensors", + "model.layers.125.mlp.down_proj.weight": "model-00190-of-00191.safetensors", + "model.layers.125.mlp.gate_proj.weight": "model-00189-of-00191.safetensors", + "model.layers.125.mlp.up_proj.weight": "model-00190-of-00191.safetensors", + "model.layers.125.post_attention_layernorm.weight": "model-00190-of-00191.safetensors", + "model.layers.125.self_attn.k_proj.weight": "model-00189-of-00191.safetensors", + "model.layers.125.self_attn.o_proj.weight": "model-00189-of-00191.safetensors", + "model.layers.125.self_attn.q_proj.weight": "model-00189-of-00191.safetensors", + "model.layers.125.self_attn.v_proj.weight": "model-00189-of-00191.safetensors", + "model.layers.13.input_layernorm.weight": "model-00022-of-00191.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00022-of-00191.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00021-of-00191.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00022-of-00191.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00022-of-00191.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00021-of-00191.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00021-of-00191.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00021-of-00191.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00021-of-00191.safetensors", + "model.layers.14.input_layernorm.weight": "model-00024-of-00191.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00024-of-00191.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00023-of-00191.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00023-of-00191.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00024-of-00191.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00022-of-00191.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00022-of-00191.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00022-of-00191.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00022-of-00191.safetensors", + "model.layers.15.input_layernorm.weight": "model-00025-of-00191.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00025-of-00191.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00024-of-00191.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00025-of-00191.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00025-of-00191.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00024-of-00191.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00024-of-00191.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00024-of-00191.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00024-of-00191.safetensors", + "model.layers.16.input_layernorm.weight": "model-00027-of-00191.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00027-of-00191.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00026-of-00191.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00026-of-00191.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00027-of-00191.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00025-of-00191.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00025-of-00191.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00025-of-00191.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00025-of-00191.safetensors", + "model.layers.17.input_layernorm.weight": "model-00028-of-00191.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00028-of-00191.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00027-of-00191.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00028-of-00191.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00028-of-00191.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00027-of-00191.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00027-of-00191.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00027-of-00191.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00027-of-00191.safetensors", + "model.layers.18.input_layernorm.weight": "model-00030-of-00191.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00030-of-00191.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00029-of-00191.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00029-of-00191.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00030-of-00191.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00028-of-00191.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00028-of-00191.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00028-of-00191.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00028-of-00191.safetensors", + "model.layers.19.input_layernorm.weight": "model-00031-of-00191.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00031-of-00191.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00030-of-00191.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00031-of-00191.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00031-of-00191.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00030-of-00191.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00030-of-00191.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00030-of-00191.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00030-of-00191.safetensors", + "model.layers.2.input_layernorm.weight": "model-00006-of-00191.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00006-of-00191.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00005-of-00191.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00005-of-00191.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00006-of-00191.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00004-of-00191.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00004-of-00191.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00004-of-00191.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00004-of-00191.safetensors", + "model.layers.20.input_layernorm.weight": "model-00033-of-00191.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00033-of-00191.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00032-of-00191.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00032-of-00191.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00033-of-00191.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00031-of-00191.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00031-of-00191.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00031-of-00191.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00031-of-00191.safetensors", + "model.layers.21.input_layernorm.weight": "model-00034-of-00191.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00034-of-00191.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00033-of-00191.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00034-of-00191.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00034-of-00191.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00033-of-00191.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00033-of-00191.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00033-of-00191.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00033-of-00191.safetensors", + "model.layers.22.input_layernorm.weight": "model-00036-of-00191.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00036-of-00191.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00035-of-00191.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00035-of-00191.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00036-of-00191.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00034-of-00191.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00034-of-00191.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00034-of-00191.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00034-of-00191.safetensors", + "model.layers.23.input_layernorm.weight": "model-00037-of-00191.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00037-of-00191.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00036-of-00191.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00037-of-00191.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00037-of-00191.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00036-of-00191.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00036-of-00191.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00036-of-00191.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00036-of-00191.safetensors", + "model.layers.24.input_layernorm.weight": "model-00039-of-00191.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00039-of-00191.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00038-of-00191.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00038-of-00191.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00039-of-00191.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00037-of-00191.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00037-of-00191.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00037-of-00191.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00037-of-00191.safetensors", + "model.layers.25.input_layernorm.weight": "model-00040-of-00191.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00040-of-00191.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00039-of-00191.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00040-of-00191.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00040-of-00191.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00039-of-00191.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00039-of-00191.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00039-of-00191.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00039-of-00191.safetensors", + "model.layers.26.input_layernorm.weight": "model-00042-of-00191.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00042-of-00191.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00041-of-00191.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00041-of-00191.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00042-of-00191.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00040-of-00191.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00040-of-00191.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00040-of-00191.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00040-of-00191.safetensors", + "model.layers.27.input_layernorm.weight": "model-00043-of-00191.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00043-of-00191.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00042-of-00191.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00043-of-00191.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00043-of-00191.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00042-of-00191.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00042-of-00191.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00042-of-00191.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00042-of-00191.safetensors", + "model.layers.28.input_layernorm.weight": "model-00045-of-00191.safetensors", + "model.layers.28.mlp.down_proj.weight": "model-00045-of-00191.safetensors", + "model.layers.28.mlp.gate_proj.weight": "model-00044-of-00191.safetensors", + "model.layers.28.mlp.up_proj.weight": "model-00044-of-00191.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00045-of-00191.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00043-of-00191.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00043-of-00191.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00043-of-00191.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00043-of-00191.safetensors", + "model.layers.29.input_layernorm.weight": "model-00046-of-00191.safetensors", + "model.layers.29.mlp.down_proj.weight": "model-00046-of-00191.safetensors", + "model.layers.29.mlp.gate_proj.weight": "model-00045-of-00191.safetensors", + "model.layers.29.mlp.up_proj.weight": "model-00046-of-00191.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00046-of-00191.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00045-of-00191.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00045-of-00191.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00045-of-00191.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00045-of-00191.safetensors", + "model.layers.3.input_layernorm.weight": "model-00007-of-00191.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00007-of-00191.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00006-of-00191.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00007-of-00191.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00007-of-00191.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00006-of-00191.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00006-of-00191.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00006-of-00191.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00006-of-00191.safetensors", + "model.layers.30.input_layernorm.weight": "model-00048-of-00191.safetensors", + "model.layers.30.mlp.down_proj.weight": "model-00048-of-00191.safetensors", + "model.layers.30.mlp.gate_proj.weight": "model-00047-of-00191.safetensors", + "model.layers.30.mlp.up_proj.weight": "model-00047-of-00191.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00048-of-00191.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00046-of-00191.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00046-of-00191.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00046-of-00191.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00046-of-00191.safetensors", + "model.layers.31.input_layernorm.weight": "model-00049-of-00191.safetensors", + "model.layers.31.mlp.down_proj.weight": "model-00049-of-00191.safetensors", + "model.layers.31.mlp.gate_proj.weight": "model-00048-of-00191.safetensors", + "model.layers.31.mlp.up_proj.weight": "model-00049-of-00191.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00049-of-00191.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00048-of-00191.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00048-of-00191.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00048-of-00191.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00048-of-00191.safetensors", + "model.layers.32.input_layernorm.weight": "model-00051-of-00191.safetensors", + "model.layers.32.mlp.down_proj.weight": "model-00051-of-00191.safetensors", + "model.layers.32.mlp.gate_proj.weight": "model-00050-of-00191.safetensors", + "model.layers.32.mlp.up_proj.weight": "model-00050-of-00191.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00051-of-00191.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00049-of-00191.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00049-of-00191.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00049-of-00191.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00049-of-00191.safetensors", + "model.layers.33.input_layernorm.weight": "model-00052-of-00191.safetensors", + "model.layers.33.mlp.down_proj.weight": "model-00052-of-00191.safetensors", + "model.layers.33.mlp.gate_proj.weight": "model-00051-of-00191.safetensors", + "model.layers.33.mlp.up_proj.weight": "model-00052-of-00191.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00052-of-00191.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00051-of-00191.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00051-of-00191.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00051-of-00191.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00051-of-00191.safetensors", + "model.layers.34.input_layernorm.weight": "model-00054-of-00191.safetensors", + "model.layers.34.mlp.down_proj.weight": "model-00054-of-00191.safetensors", + "model.layers.34.mlp.gate_proj.weight": "model-00053-of-00191.safetensors", + "model.layers.34.mlp.up_proj.weight": "model-00053-of-00191.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00054-of-00191.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00052-of-00191.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00052-of-00191.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00052-of-00191.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00052-of-00191.safetensors", + "model.layers.35.input_layernorm.weight": "model-00055-of-00191.safetensors", + "model.layers.35.mlp.down_proj.weight": "model-00055-of-00191.safetensors", + "model.layers.35.mlp.gate_proj.weight": "model-00054-of-00191.safetensors", + "model.layers.35.mlp.up_proj.weight": "model-00055-of-00191.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00055-of-00191.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00054-of-00191.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00054-of-00191.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00054-of-00191.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00054-of-00191.safetensors", + "model.layers.36.input_layernorm.weight": "model-00057-of-00191.safetensors", + "model.layers.36.mlp.down_proj.weight": "model-00057-of-00191.safetensors", + "model.layers.36.mlp.gate_proj.weight": "model-00056-of-00191.safetensors", + "model.layers.36.mlp.up_proj.weight": "model-00056-of-00191.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00057-of-00191.safetensors", + "model.layers.36.self_attn.k_proj.weight": "model-00055-of-00191.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00055-of-00191.safetensors", + "model.layers.36.self_attn.q_proj.weight": "model-00055-of-00191.safetensors", + "model.layers.36.self_attn.v_proj.weight": "model-00055-of-00191.safetensors", + "model.layers.37.input_layernorm.weight": "model-00058-of-00191.safetensors", + "model.layers.37.mlp.down_proj.weight": "model-00058-of-00191.safetensors", + "model.layers.37.mlp.gate_proj.weight": "model-00057-of-00191.safetensors", + "model.layers.37.mlp.up_proj.weight": "model-00058-of-00191.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00058-of-00191.safetensors", + "model.layers.37.self_attn.k_proj.weight": "model-00057-of-00191.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00057-of-00191.safetensors", + "model.layers.37.self_attn.q_proj.weight": "model-00057-of-00191.safetensors", + "model.layers.37.self_attn.v_proj.weight": "model-00057-of-00191.safetensors", + "model.layers.38.input_layernorm.weight": "model-00060-of-00191.safetensors", + "model.layers.38.mlp.down_proj.weight": "model-00060-of-00191.safetensors", + "model.layers.38.mlp.gate_proj.weight": "model-00059-of-00191.safetensors", + "model.layers.38.mlp.up_proj.weight": "model-00059-of-00191.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00060-of-00191.safetensors", + "model.layers.38.self_attn.k_proj.weight": "model-00058-of-00191.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00058-of-00191.safetensors", + "model.layers.38.self_attn.q_proj.weight": "model-00058-of-00191.safetensors", + "model.layers.38.self_attn.v_proj.weight": "model-00058-of-00191.safetensors", + "model.layers.39.input_layernorm.weight": "model-00061-of-00191.safetensors", + "model.layers.39.mlp.down_proj.weight": "model-00061-of-00191.safetensors", + "model.layers.39.mlp.gate_proj.weight": "model-00060-of-00191.safetensors", + "model.layers.39.mlp.up_proj.weight": "model-00061-of-00191.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00061-of-00191.safetensors", + "model.layers.39.self_attn.k_proj.weight": "model-00060-of-00191.safetensors", + "model.layers.39.self_attn.o_proj.weight": "model-00060-of-00191.safetensors", + "model.layers.39.self_attn.q_proj.weight": "model-00060-of-00191.safetensors", + "model.layers.39.self_attn.v_proj.weight": "model-00060-of-00191.safetensors", + "model.layers.4.input_layernorm.weight": "model-00009-of-00191.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00009-of-00191.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00008-of-00191.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00008-of-00191.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00009-of-00191.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00007-of-00191.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00007-of-00191.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00007-of-00191.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00007-of-00191.safetensors", + "model.layers.40.input_layernorm.weight": "model-00063-of-00191.safetensors", + "model.layers.40.mlp.down_proj.weight": "model-00063-of-00191.safetensors", + "model.layers.40.mlp.gate_proj.weight": "model-00062-of-00191.safetensors", + "model.layers.40.mlp.up_proj.weight": "model-00062-of-00191.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00063-of-00191.safetensors", + "model.layers.40.self_attn.k_proj.weight": "model-00061-of-00191.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00061-of-00191.safetensors", + "model.layers.40.self_attn.q_proj.weight": "model-00061-of-00191.safetensors", + "model.layers.40.self_attn.v_proj.weight": "model-00061-of-00191.safetensors", + "model.layers.41.input_layernorm.weight": "model-00064-of-00191.safetensors", + "model.layers.41.mlp.down_proj.weight": "model-00064-of-00191.safetensors", + "model.layers.41.mlp.gate_proj.weight": "model-00063-of-00191.safetensors", + "model.layers.41.mlp.up_proj.weight": "model-00064-of-00191.safetensors", + "model.layers.41.post_attention_layernorm.weight": "model-00064-of-00191.safetensors", + "model.layers.41.self_attn.k_proj.weight": "model-00063-of-00191.safetensors", + "model.layers.41.self_attn.o_proj.weight": "model-00063-of-00191.safetensors", + "model.layers.41.self_attn.q_proj.weight": "model-00063-of-00191.safetensors", + "model.layers.41.self_attn.v_proj.weight": "model-00063-of-00191.safetensors", + "model.layers.42.input_layernorm.weight": "model-00066-of-00191.safetensors", + "model.layers.42.mlp.down_proj.weight": "model-00066-of-00191.safetensors", + "model.layers.42.mlp.gate_proj.weight": "model-00065-of-00191.safetensors", + "model.layers.42.mlp.up_proj.weight": "model-00065-of-00191.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00066-of-00191.safetensors", + "model.layers.42.self_attn.k_proj.weight": "model-00064-of-00191.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00064-of-00191.safetensors", + "model.layers.42.self_attn.q_proj.weight": "model-00064-of-00191.safetensors", + "model.layers.42.self_attn.v_proj.weight": "model-00064-of-00191.safetensors", + "model.layers.43.input_layernorm.weight": "model-00067-of-00191.safetensors", + "model.layers.43.mlp.down_proj.weight": "model-00067-of-00191.safetensors", + "model.layers.43.mlp.gate_proj.weight": "model-00066-of-00191.safetensors", + "model.layers.43.mlp.up_proj.weight": "model-00067-of-00191.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00067-of-00191.safetensors", + "model.layers.43.self_attn.k_proj.weight": "model-00066-of-00191.safetensors", + "model.layers.43.self_attn.o_proj.weight": "model-00066-of-00191.safetensors", + "model.layers.43.self_attn.q_proj.weight": "model-00066-of-00191.safetensors", + "model.layers.43.self_attn.v_proj.weight": "model-00066-of-00191.safetensors", + "model.layers.44.input_layernorm.weight": "model-00069-of-00191.safetensors", + "model.layers.44.mlp.down_proj.weight": "model-00069-of-00191.safetensors", + "model.layers.44.mlp.gate_proj.weight": "model-00068-of-00191.safetensors", + "model.layers.44.mlp.up_proj.weight": "model-00068-of-00191.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00069-of-00191.safetensors", + "model.layers.44.self_attn.k_proj.weight": "model-00067-of-00191.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00067-of-00191.safetensors", + "model.layers.44.self_attn.q_proj.weight": "model-00067-of-00191.safetensors", + "model.layers.44.self_attn.v_proj.weight": "model-00067-of-00191.safetensors", + "model.layers.45.input_layernorm.weight": "model-00070-of-00191.safetensors", + "model.layers.45.mlp.down_proj.weight": "model-00070-of-00191.safetensors", + "model.layers.45.mlp.gate_proj.weight": "model-00069-of-00191.safetensors", + "model.layers.45.mlp.up_proj.weight": "model-00070-of-00191.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00070-of-00191.safetensors", + "model.layers.45.self_attn.k_proj.weight": "model-00069-of-00191.safetensors", + "model.layers.45.self_attn.o_proj.weight": "model-00069-of-00191.safetensors", + "model.layers.45.self_attn.q_proj.weight": "model-00069-of-00191.safetensors", + "model.layers.45.self_attn.v_proj.weight": "model-00069-of-00191.safetensors", + "model.layers.46.input_layernorm.weight": "model-00072-of-00191.safetensors", + "model.layers.46.mlp.down_proj.weight": "model-00072-of-00191.safetensors", + "model.layers.46.mlp.gate_proj.weight": "model-00071-of-00191.safetensors", + "model.layers.46.mlp.up_proj.weight": "model-00071-of-00191.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00072-of-00191.safetensors", + "model.layers.46.self_attn.k_proj.weight": "model-00070-of-00191.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00070-of-00191.safetensors", + "model.layers.46.self_attn.q_proj.weight": "model-00070-of-00191.safetensors", + "model.layers.46.self_attn.v_proj.weight": "model-00070-of-00191.safetensors", + "model.layers.47.input_layernorm.weight": "model-00073-of-00191.safetensors", + "model.layers.47.mlp.down_proj.weight": "model-00073-of-00191.safetensors", + "model.layers.47.mlp.gate_proj.weight": "model-00072-of-00191.safetensors", + "model.layers.47.mlp.up_proj.weight": "model-00073-of-00191.safetensors", + "model.layers.47.post_attention_layernorm.weight": "model-00073-of-00191.safetensors", + "model.layers.47.self_attn.k_proj.weight": "model-00072-of-00191.safetensors", + "model.layers.47.self_attn.o_proj.weight": "model-00072-of-00191.safetensors", + "model.layers.47.self_attn.q_proj.weight": "model-00072-of-00191.safetensors", + "model.layers.47.self_attn.v_proj.weight": "model-00072-of-00191.safetensors", + "model.layers.48.input_layernorm.weight": "model-00075-of-00191.safetensors", + "model.layers.48.mlp.down_proj.weight": "model-00075-of-00191.safetensors", + "model.layers.48.mlp.gate_proj.weight": "model-00074-of-00191.safetensors", + "model.layers.48.mlp.up_proj.weight": "model-00074-of-00191.safetensors", + "model.layers.48.post_attention_layernorm.weight": "model-00075-of-00191.safetensors", + "model.layers.48.self_attn.k_proj.weight": "model-00073-of-00191.safetensors", + "model.layers.48.self_attn.o_proj.weight": "model-00073-of-00191.safetensors", + "model.layers.48.self_attn.q_proj.weight": "model-00073-of-00191.safetensors", + "model.layers.48.self_attn.v_proj.weight": "model-00073-of-00191.safetensors", + "model.layers.49.input_layernorm.weight": "model-00076-of-00191.safetensors", + "model.layers.49.mlp.down_proj.weight": "model-00076-of-00191.safetensors", + "model.layers.49.mlp.gate_proj.weight": "model-00075-of-00191.safetensors", + "model.layers.49.mlp.up_proj.weight": "model-00076-of-00191.safetensors", + "model.layers.49.post_attention_layernorm.weight": "model-00076-of-00191.safetensors", + "model.layers.49.self_attn.k_proj.weight": "model-00075-of-00191.safetensors", + "model.layers.49.self_attn.o_proj.weight": "model-00075-of-00191.safetensors", + "model.layers.49.self_attn.q_proj.weight": "model-00075-of-00191.safetensors", + "model.layers.49.self_attn.v_proj.weight": "model-00075-of-00191.safetensors", + "model.layers.5.input_layernorm.weight": "model-00010-of-00191.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00010-of-00191.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00009-of-00191.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00010-of-00191.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00010-of-00191.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00009-of-00191.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00009-of-00191.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00009-of-00191.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00009-of-00191.safetensors", + "model.layers.50.input_layernorm.weight": "model-00078-of-00191.safetensors", + "model.layers.50.mlp.down_proj.weight": "model-00078-of-00191.safetensors", + "model.layers.50.mlp.gate_proj.weight": "model-00077-of-00191.safetensors", + "model.layers.50.mlp.up_proj.weight": "model-00077-of-00191.safetensors", + "model.layers.50.post_attention_layernorm.weight": "model-00078-of-00191.safetensors", + "model.layers.50.self_attn.k_proj.weight": "model-00076-of-00191.safetensors", + "model.layers.50.self_attn.o_proj.weight": "model-00076-of-00191.safetensors", + "model.layers.50.self_attn.q_proj.weight": "model-00076-of-00191.safetensors", + "model.layers.50.self_attn.v_proj.weight": "model-00076-of-00191.safetensors", + "model.layers.51.input_layernorm.weight": "model-00079-of-00191.safetensors", + "model.layers.51.mlp.down_proj.weight": "model-00079-of-00191.safetensors", + "model.layers.51.mlp.gate_proj.weight": "model-00078-of-00191.safetensors", + "model.layers.51.mlp.up_proj.weight": "model-00079-of-00191.safetensors", + "model.layers.51.post_attention_layernorm.weight": "model-00079-of-00191.safetensors", + "model.layers.51.self_attn.k_proj.weight": "model-00078-of-00191.safetensors", + "model.layers.51.self_attn.o_proj.weight": "model-00078-of-00191.safetensors", + "model.layers.51.self_attn.q_proj.weight": "model-00078-of-00191.safetensors", + "model.layers.51.self_attn.v_proj.weight": "model-00078-of-00191.safetensors", + "model.layers.52.input_layernorm.weight": "model-00081-of-00191.safetensors", + "model.layers.52.mlp.down_proj.weight": "model-00081-of-00191.safetensors", + "model.layers.52.mlp.gate_proj.weight": "model-00080-of-00191.safetensors", + "model.layers.52.mlp.up_proj.weight": "model-00080-of-00191.safetensors", + "model.layers.52.post_attention_layernorm.weight": "model-00081-of-00191.safetensors", + "model.layers.52.self_attn.k_proj.weight": "model-00079-of-00191.safetensors", + "model.layers.52.self_attn.o_proj.weight": "model-00079-of-00191.safetensors", + "model.layers.52.self_attn.q_proj.weight": "model-00079-of-00191.safetensors", + "model.layers.52.self_attn.v_proj.weight": "model-00079-of-00191.safetensors", + "model.layers.53.input_layernorm.weight": "model-00082-of-00191.safetensors", + "model.layers.53.mlp.down_proj.weight": "model-00082-of-00191.safetensors", + "model.layers.53.mlp.gate_proj.weight": "model-00081-of-00191.safetensors", + "model.layers.53.mlp.up_proj.weight": "model-00082-of-00191.safetensors", + "model.layers.53.post_attention_layernorm.weight": "model-00082-of-00191.safetensors", + "model.layers.53.self_attn.k_proj.weight": "model-00081-of-00191.safetensors", + "model.layers.53.self_attn.o_proj.weight": "model-00081-of-00191.safetensors", + "model.layers.53.self_attn.q_proj.weight": "model-00081-of-00191.safetensors", + "model.layers.53.self_attn.v_proj.weight": "model-00081-of-00191.safetensors", + "model.layers.54.input_layernorm.weight": "model-00084-of-00191.safetensors", + "model.layers.54.mlp.down_proj.weight": "model-00084-of-00191.safetensors", + "model.layers.54.mlp.gate_proj.weight": "model-00083-of-00191.safetensors", + "model.layers.54.mlp.up_proj.weight": "model-00083-of-00191.safetensors", + "model.layers.54.post_attention_layernorm.weight": "model-00084-of-00191.safetensors", + "model.layers.54.self_attn.k_proj.weight": "model-00082-of-00191.safetensors", + "model.layers.54.self_attn.o_proj.weight": "model-00082-of-00191.safetensors", + "model.layers.54.self_attn.q_proj.weight": "model-00082-of-00191.safetensors", + "model.layers.54.self_attn.v_proj.weight": "model-00082-of-00191.safetensors", + "model.layers.55.input_layernorm.weight": "model-00085-of-00191.safetensors", + "model.layers.55.mlp.down_proj.weight": "model-00085-of-00191.safetensors", + "model.layers.55.mlp.gate_proj.weight": "model-00084-of-00191.safetensors", + "model.layers.55.mlp.up_proj.weight": "model-00085-of-00191.safetensors", + "model.layers.55.post_attention_layernorm.weight": "model-00085-of-00191.safetensors", + "model.layers.55.self_attn.k_proj.weight": "model-00084-of-00191.safetensors", + "model.layers.55.self_attn.o_proj.weight": "model-00084-of-00191.safetensors", + "model.layers.55.self_attn.q_proj.weight": "model-00084-of-00191.safetensors", + "model.layers.55.self_attn.v_proj.weight": "model-00084-of-00191.safetensors", + "model.layers.56.input_layernorm.weight": "model-00087-of-00191.safetensors", + "model.layers.56.mlp.down_proj.weight": "model-00087-of-00191.safetensors", + "model.layers.56.mlp.gate_proj.weight": "model-00086-of-00191.safetensors", + "model.layers.56.mlp.up_proj.weight": "model-00086-of-00191.safetensors", + "model.layers.56.post_attention_layernorm.weight": "model-00087-of-00191.safetensors", + "model.layers.56.self_attn.k_proj.weight": "model-00085-of-00191.safetensors", + "model.layers.56.self_attn.o_proj.weight": "model-00085-of-00191.safetensors", + "model.layers.56.self_attn.q_proj.weight": "model-00085-of-00191.safetensors", + "model.layers.56.self_attn.v_proj.weight": "model-00085-of-00191.safetensors", + "model.layers.57.input_layernorm.weight": "model-00088-of-00191.safetensors", + "model.layers.57.mlp.down_proj.weight": "model-00088-of-00191.safetensors", + "model.layers.57.mlp.gate_proj.weight": "model-00087-of-00191.safetensors", + "model.layers.57.mlp.up_proj.weight": "model-00088-of-00191.safetensors", + "model.layers.57.post_attention_layernorm.weight": "model-00088-of-00191.safetensors", + "model.layers.57.self_attn.k_proj.weight": "model-00087-of-00191.safetensors", + "model.layers.57.self_attn.o_proj.weight": "model-00087-of-00191.safetensors", + "model.layers.57.self_attn.q_proj.weight": "model-00087-of-00191.safetensors", + "model.layers.57.self_attn.v_proj.weight": "model-00087-of-00191.safetensors", + "model.layers.58.input_layernorm.weight": "model-00090-of-00191.safetensors", + "model.layers.58.mlp.down_proj.weight": "model-00090-of-00191.safetensors", + "model.layers.58.mlp.gate_proj.weight": "model-00089-of-00191.safetensors", + "model.layers.58.mlp.up_proj.weight": "model-00089-of-00191.safetensors", + "model.layers.58.post_attention_layernorm.weight": "model-00090-of-00191.safetensors", + "model.layers.58.self_attn.k_proj.weight": "model-00088-of-00191.safetensors", + "model.layers.58.self_attn.o_proj.weight": "model-00088-of-00191.safetensors", + "model.layers.58.self_attn.q_proj.weight": "model-00088-of-00191.safetensors", + "model.layers.58.self_attn.v_proj.weight": "model-00088-of-00191.safetensors", + "model.layers.59.input_layernorm.weight": "model-00091-of-00191.safetensors", + "model.layers.59.mlp.down_proj.weight": "model-00091-of-00191.safetensors", + "model.layers.59.mlp.gate_proj.weight": "model-00090-of-00191.safetensors", + "model.layers.59.mlp.up_proj.weight": "model-00091-of-00191.safetensors", + "model.layers.59.post_attention_layernorm.weight": "model-00091-of-00191.safetensors", + "model.layers.59.self_attn.k_proj.weight": "model-00090-of-00191.safetensors", + "model.layers.59.self_attn.o_proj.weight": "model-00090-of-00191.safetensors", + "model.layers.59.self_attn.q_proj.weight": "model-00090-of-00191.safetensors", + "model.layers.59.self_attn.v_proj.weight": "model-00090-of-00191.safetensors", + "model.layers.6.input_layernorm.weight": "model-00012-of-00191.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00012-of-00191.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00011-of-00191.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00011-of-00191.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00012-of-00191.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00010-of-00191.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00010-of-00191.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00010-of-00191.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00010-of-00191.safetensors", + "model.layers.60.input_layernorm.weight": "model-00093-of-00191.safetensors", + "model.layers.60.mlp.down_proj.weight": "model-00093-of-00191.safetensors", + "model.layers.60.mlp.gate_proj.weight": "model-00092-of-00191.safetensors", + "model.layers.60.mlp.up_proj.weight": "model-00092-of-00191.safetensors", + "model.layers.60.post_attention_layernorm.weight": "model-00093-of-00191.safetensors", + "model.layers.60.self_attn.k_proj.weight": "model-00091-of-00191.safetensors", + "model.layers.60.self_attn.o_proj.weight": "model-00091-of-00191.safetensors", + "model.layers.60.self_attn.q_proj.weight": "model-00091-of-00191.safetensors", + "model.layers.60.self_attn.v_proj.weight": "model-00091-of-00191.safetensors", + "model.layers.61.input_layernorm.weight": "model-00094-of-00191.safetensors", + "model.layers.61.mlp.down_proj.weight": "model-00094-of-00191.safetensors", + "model.layers.61.mlp.gate_proj.weight": "model-00093-of-00191.safetensors", + "model.layers.61.mlp.up_proj.weight": "model-00094-of-00191.safetensors", + "model.layers.61.post_attention_layernorm.weight": "model-00094-of-00191.safetensors", + "model.layers.61.self_attn.k_proj.weight": "model-00093-of-00191.safetensors", + "model.layers.61.self_attn.o_proj.weight": "model-00093-of-00191.safetensors", + "model.layers.61.self_attn.q_proj.weight": "model-00093-of-00191.safetensors", + "model.layers.61.self_attn.v_proj.weight": "model-00093-of-00191.safetensors", + "model.layers.62.input_layernorm.weight": "model-00096-of-00191.safetensors", + "model.layers.62.mlp.down_proj.weight": "model-00096-of-00191.safetensors", + "model.layers.62.mlp.gate_proj.weight": "model-00095-of-00191.safetensors", + "model.layers.62.mlp.up_proj.weight": "model-00095-of-00191.safetensors", + "model.layers.62.post_attention_layernorm.weight": "model-00096-of-00191.safetensors", + "model.layers.62.self_attn.k_proj.weight": "model-00094-of-00191.safetensors", + "model.layers.62.self_attn.o_proj.weight": "model-00094-of-00191.safetensors", + "model.layers.62.self_attn.q_proj.weight": "model-00094-of-00191.safetensors", + "model.layers.62.self_attn.v_proj.weight": "model-00094-of-00191.safetensors", + "model.layers.63.input_layernorm.weight": "model-00097-of-00191.safetensors", + "model.layers.63.mlp.down_proj.weight": "model-00097-of-00191.safetensors", + "model.layers.63.mlp.gate_proj.weight": "model-00096-of-00191.safetensors", + "model.layers.63.mlp.up_proj.weight": "model-00097-of-00191.safetensors", + "model.layers.63.post_attention_layernorm.weight": "model-00097-of-00191.safetensors", + "model.layers.63.self_attn.k_proj.weight": "model-00096-of-00191.safetensors", + "model.layers.63.self_attn.o_proj.weight": "model-00096-of-00191.safetensors", + "model.layers.63.self_attn.q_proj.weight": "model-00096-of-00191.safetensors", + "model.layers.63.self_attn.v_proj.weight": "model-00096-of-00191.safetensors", + "model.layers.64.input_layernorm.weight": "model-00099-of-00191.safetensors", + "model.layers.64.mlp.down_proj.weight": "model-00099-of-00191.safetensors", + "model.layers.64.mlp.gate_proj.weight": "model-00098-of-00191.safetensors", + "model.layers.64.mlp.up_proj.weight": "model-00098-of-00191.safetensors", + "model.layers.64.post_attention_layernorm.weight": "model-00099-of-00191.safetensors", + "model.layers.64.self_attn.k_proj.weight": "model-00097-of-00191.safetensors", + "model.layers.64.self_attn.o_proj.weight": "model-00097-of-00191.safetensors", + "model.layers.64.self_attn.q_proj.weight": "model-00097-of-00191.safetensors", + "model.layers.64.self_attn.v_proj.weight": "model-00097-of-00191.safetensors", + "model.layers.65.input_layernorm.weight": "model-00100-of-00191.safetensors", + "model.layers.65.mlp.down_proj.weight": "model-00100-of-00191.safetensors", + "model.layers.65.mlp.gate_proj.weight": "model-00099-of-00191.safetensors", + "model.layers.65.mlp.up_proj.weight": "model-00100-of-00191.safetensors", + "model.layers.65.post_attention_layernorm.weight": "model-00100-of-00191.safetensors", + "model.layers.65.self_attn.k_proj.weight": "model-00099-of-00191.safetensors", + "model.layers.65.self_attn.o_proj.weight": "model-00099-of-00191.safetensors", + "model.layers.65.self_attn.q_proj.weight": "model-00099-of-00191.safetensors", + "model.layers.65.self_attn.v_proj.weight": "model-00099-of-00191.safetensors", + "model.layers.66.input_layernorm.weight": "model-00102-of-00191.safetensors", + "model.layers.66.mlp.down_proj.weight": "model-00102-of-00191.safetensors", + "model.layers.66.mlp.gate_proj.weight": "model-00101-of-00191.safetensors", + "model.layers.66.mlp.up_proj.weight": "model-00101-of-00191.safetensors", + "model.layers.66.post_attention_layernorm.weight": "model-00102-of-00191.safetensors", + "model.layers.66.self_attn.k_proj.weight": "model-00100-of-00191.safetensors", + "model.layers.66.self_attn.o_proj.weight": "model-00100-of-00191.safetensors", + "model.layers.66.self_attn.q_proj.weight": "model-00100-of-00191.safetensors", + "model.layers.66.self_attn.v_proj.weight": "model-00100-of-00191.safetensors", + "model.layers.67.input_layernorm.weight": "model-00103-of-00191.safetensors", + "model.layers.67.mlp.down_proj.weight": "model-00103-of-00191.safetensors", + "model.layers.67.mlp.gate_proj.weight": "model-00102-of-00191.safetensors", + "model.layers.67.mlp.up_proj.weight": "model-00103-of-00191.safetensors", + "model.layers.67.post_attention_layernorm.weight": "model-00103-of-00191.safetensors", + "model.layers.67.self_attn.k_proj.weight": "model-00102-of-00191.safetensors", + "model.layers.67.self_attn.o_proj.weight": "model-00102-of-00191.safetensors", + "model.layers.67.self_attn.q_proj.weight": "model-00102-of-00191.safetensors", + "model.layers.67.self_attn.v_proj.weight": "model-00102-of-00191.safetensors", + "model.layers.68.input_layernorm.weight": "model-00105-of-00191.safetensors", + "model.layers.68.mlp.down_proj.weight": "model-00105-of-00191.safetensors", + "model.layers.68.mlp.gate_proj.weight": "model-00104-of-00191.safetensors", + "model.layers.68.mlp.up_proj.weight": "model-00104-of-00191.safetensors", + "model.layers.68.post_attention_layernorm.weight": "model-00105-of-00191.safetensors", + "model.layers.68.self_attn.k_proj.weight": "model-00103-of-00191.safetensors", + "model.layers.68.self_attn.o_proj.weight": "model-00103-of-00191.safetensors", + "model.layers.68.self_attn.q_proj.weight": "model-00103-of-00191.safetensors", + "model.layers.68.self_attn.v_proj.weight": "model-00103-of-00191.safetensors", + "model.layers.69.input_layernorm.weight": "model-00106-of-00191.safetensors", + "model.layers.69.mlp.down_proj.weight": "model-00106-of-00191.safetensors", + "model.layers.69.mlp.gate_proj.weight": "model-00105-of-00191.safetensors", + "model.layers.69.mlp.up_proj.weight": "model-00106-of-00191.safetensors", + "model.layers.69.post_attention_layernorm.weight": "model-00106-of-00191.safetensors", + "model.layers.69.self_attn.k_proj.weight": "model-00105-of-00191.safetensors", + "model.layers.69.self_attn.o_proj.weight": "model-00105-of-00191.safetensors", + "model.layers.69.self_attn.q_proj.weight": "model-00105-of-00191.safetensors", + "model.layers.69.self_attn.v_proj.weight": "model-00105-of-00191.safetensors", + "model.layers.7.input_layernorm.weight": "model-00013-of-00191.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00013-of-00191.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00012-of-00191.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00013-of-00191.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00013-of-00191.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00012-of-00191.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00012-of-00191.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00012-of-00191.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00012-of-00191.safetensors", + "model.layers.70.input_layernorm.weight": "model-00108-of-00191.safetensors", + "model.layers.70.mlp.down_proj.weight": "model-00108-of-00191.safetensors", + "model.layers.70.mlp.gate_proj.weight": "model-00107-of-00191.safetensors", + "model.layers.70.mlp.up_proj.weight": "model-00107-of-00191.safetensors", + "model.layers.70.post_attention_layernorm.weight": "model-00108-of-00191.safetensors", + "model.layers.70.self_attn.k_proj.weight": "model-00106-of-00191.safetensors", + "model.layers.70.self_attn.o_proj.weight": "model-00106-of-00191.safetensors", + "model.layers.70.self_attn.q_proj.weight": "model-00106-of-00191.safetensors", + "model.layers.70.self_attn.v_proj.weight": "model-00106-of-00191.safetensors", + "model.layers.71.input_layernorm.weight": "model-00109-of-00191.safetensors", + "model.layers.71.mlp.down_proj.weight": "model-00109-of-00191.safetensors", + "model.layers.71.mlp.gate_proj.weight": "model-00108-of-00191.safetensors", + "model.layers.71.mlp.up_proj.weight": "model-00109-of-00191.safetensors", + "model.layers.71.post_attention_layernorm.weight": "model-00109-of-00191.safetensors", + "model.layers.71.self_attn.k_proj.weight": "model-00108-of-00191.safetensors", + "model.layers.71.self_attn.o_proj.weight": "model-00108-of-00191.safetensors", + "model.layers.71.self_attn.q_proj.weight": "model-00108-of-00191.safetensors", + "model.layers.71.self_attn.v_proj.weight": "model-00108-of-00191.safetensors", + "model.layers.72.input_layernorm.weight": "model-00111-of-00191.safetensors", + "model.layers.72.mlp.down_proj.weight": "model-00111-of-00191.safetensors", + "model.layers.72.mlp.gate_proj.weight": "model-00110-of-00191.safetensors", + "model.layers.72.mlp.up_proj.weight": "model-00110-of-00191.safetensors", + "model.layers.72.post_attention_layernorm.weight": "model-00111-of-00191.safetensors", + "model.layers.72.self_attn.k_proj.weight": "model-00109-of-00191.safetensors", + "model.layers.72.self_attn.o_proj.weight": "model-00109-of-00191.safetensors", + "model.layers.72.self_attn.q_proj.weight": "model-00109-of-00191.safetensors", + "model.layers.72.self_attn.v_proj.weight": "model-00109-of-00191.safetensors", + "model.layers.73.input_layernorm.weight": "model-00112-of-00191.safetensors", + "model.layers.73.mlp.down_proj.weight": "model-00112-of-00191.safetensors", + "model.layers.73.mlp.gate_proj.weight": "model-00111-of-00191.safetensors", + "model.layers.73.mlp.up_proj.weight": "model-00112-of-00191.safetensors", + "model.layers.73.post_attention_layernorm.weight": "model-00112-of-00191.safetensors", + "model.layers.73.self_attn.k_proj.weight": "model-00111-of-00191.safetensors", + "model.layers.73.self_attn.o_proj.weight": "model-00111-of-00191.safetensors", + "model.layers.73.self_attn.q_proj.weight": "model-00111-of-00191.safetensors", + "model.layers.73.self_attn.v_proj.weight": "model-00111-of-00191.safetensors", + "model.layers.74.input_layernorm.weight": "model-00114-of-00191.safetensors", + "model.layers.74.mlp.down_proj.weight": "model-00114-of-00191.safetensors", + "model.layers.74.mlp.gate_proj.weight": "model-00113-of-00191.safetensors", + "model.layers.74.mlp.up_proj.weight": "model-00113-of-00191.safetensors", + "model.layers.74.post_attention_layernorm.weight": "model-00114-of-00191.safetensors", + "model.layers.74.self_attn.k_proj.weight": "model-00112-of-00191.safetensors", + "model.layers.74.self_attn.o_proj.weight": "model-00112-of-00191.safetensors", + "model.layers.74.self_attn.q_proj.weight": "model-00112-of-00191.safetensors", + "model.layers.74.self_attn.v_proj.weight": "model-00112-of-00191.safetensors", + "model.layers.75.input_layernorm.weight": "model-00115-of-00191.safetensors", + "model.layers.75.mlp.down_proj.weight": "model-00115-of-00191.safetensors", + "model.layers.75.mlp.gate_proj.weight": "model-00114-of-00191.safetensors", + "model.layers.75.mlp.up_proj.weight": "model-00115-of-00191.safetensors", + "model.layers.75.post_attention_layernorm.weight": "model-00115-of-00191.safetensors", + "model.layers.75.self_attn.k_proj.weight": "model-00114-of-00191.safetensors", + "model.layers.75.self_attn.o_proj.weight": "model-00114-of-00191.safetensors", + "model.layers.75.self_attn.q_proj.weight": "model-00114-of-00191.safetensors", + "model.layers.75.self_attn.v_proj.weight": "model-00114-of-00191.safetensors", + "model.layers.76.input_layernorm.weight": "model-00117-of-00191.safetensors", + "model.layers.76.mlp.down_proj.weight": "model-00117-of-00191.safetensors", + "model.layers.76.mlp.gate_proj.weight": "model-00116-of-00191.safetensors", + "model.layers.76.mlp.up_proj.weight": "model-00116-of-00191.safetensors", + "model.layers.76.post_attention_layernorm.weight": "model-00117-of-00191.safetensors", + "model.layers.76.self_attn.k_proj.weight": "model-00115-of-00191.safetensors", + "model.layers.76.self_attn.o_proj.weight": "model-00115-of-00191.safetensors", + "model.layers.76.self_attn.q_proj.weight": "model-00115-of-00191.safetensors", + "model.layers.76.self_attn.v_proj.weight": "model-00115-of-00191.safetensors", + "model.layers.77.input_layernorm.weight": "model-00118-of-00191.safetensors", + "model.layers.77.mlp.down_proj.weight": "model-00118-of-00191.safetensors", + "model.layers.77.mlp.gate_proj.weight": "model-00117-of-00191.safetensors", + "model.layers.77.mlp.up_proj.weight": "model-00118-of-00191.safetensors", + "model.layers.77.post_attention_layernorm.weight": "model-00118-of-00191.safetensors", + "model.layers.77.self_attn.k_proj.weight": "model-00117-of-00191.safetensors", + "model.layers.77.self_attn.o_proj.weight": "model-00117-of-00191.safetensors", + "model.layers.77.self_attn.q_proj.weight": "model-00117-of-00191.safetensors", + "model.layers.77.self_attn.v_proj.weight": "model-00117-of-00191.safetensors", + "model.layers.78.input_layernorm.weight": "model-00120-of-00191.safetensors", + "model.layers.78.mlp.down_proj.weight": "model-00120-of-00191.safetensors", + "model.layers.78.mlp.gate_proj.weight": "model-00119-of-00191.safetensors", + "model.layers.78.mlp.up_proj.weight": "model-00119-of-00191.safetensors", + "model.layers.78.post_attention_layernorm.weight": "model-00120-of-00191.safetensors", + "model.layers.78.self_attn.k_proj.weight": "model-00118-of-00191.safetensors", + "model.layers.78.self_attn.o_proj.weight": "model-00118-of-00191.safetensors", + "model.layers.78.self_attn.q_proj.weight": "model-00118-of-00191.safetensors", + "model.layers.78.self_attn.v_proj.weight": "model-00118-of-00191.safetensors", + "model.layers.79.input_layernorm.weight": "model-00121-of-00191.safetensors", + "model.layers.79.mlp.down_proj.weight": "model-00121-of-00191.safetensors", + "model.layers.79.mlp.gate_proj.weight": "model-00120-of-00191.safetensors", + "model.layers.79.mlp.up_proj.weight": "model-00121-of-00191.safetensors", + "model.layers.79.post_attention_layernorm.weight": "model-00121-of-00191.safetensors", + "model.layers.79.self_attn.k_proj.weight": "model-00120-of-00191.safetensors", + "model.layers.79.self_attn.o_proj.weight": "model-00120-of-00191.safetensors", + "model.layers.79.self_attn.q_proj.weight": "model-00120-of-00191.safetensors", + "model.layers.79.self_attn.v_proj.weight": "model-00120-of-00191.safetensors", + "model.layers.8.input_layernorm.weight": "model-00015-of-00191.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00015-of-00191.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00014-of-00191.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00014-of-00191.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00015-of-00191.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00013-of-00191.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00013-of-00191.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00013-of-00191.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00013-of-00191.safetensors", + "model.layers.80.input_layernorm.weight": "model-00123-of-00191.safetensors", + "model.layers.80.mlp.down_proj.weight": "model-00123-of-00191.safetensors", + "model.layers.80.mlp.gate_proj.weight": "model-00122-of-00191.safetensors", + "model.layers.80.mlp.up_proj.weight": "model-00122-of-00191.safetensors", + "model.layers.80.post_attention_layernorm.weight": "model-00123-of-00191.safetensors", + "model.layers.80.self_attn.k_proj.weight": "model-00121-of-00191.safetensors", + "model.layers.80.self_attn.o_proj.weight": "model-00121-of-00191.safetensors", + "model.layers.80.self_attn.q_proj.weight": "model-00121-of-00191.safetensors", + "model.layers.80.self_attn.v_proj.weight": "model-00121-of-00191.safetensors", + "model.layers.81.input_layernorm.weight": "model-00124-of-00191.safetensors", + "model.layers.81.mlp.down_proj.weight": "model-00124-of-00191.safetensors", + "model.layers.81.mlp.gate_proj.weight": "model-00123-of-00191.safetensors", + "model.layers.81.mlp.up_proj.weight": "model-00124-of-00191.safetensors", + "model.layers.81.post_attention_layernorm.weight": "model-00124-of-00191.safetensors", + "model.layers.81.self_attn.k_proj.weight": "model-00123-of-00191.safetensors", + "model.layers.81.self_attn.o_proj.weight": "model-00123-of-00191.safetensors", + "model.layers.81.self_attn.q_proj.weight": "model-00123-of-00191.safetensors", + "model.layers.81.self_attn.v_proj.weight": "model-00123-of-00191.safetensors", + "model.layers.82.input_layernorm.weight": "model-00126-of-00191.safetensors", + "model.layers.82.mlp.down_proj.weight": "model-00126-of-00191.safetensors", + "model.layers.82.mlp.gate_proj.weight": "model-00125-of-00191.safetensors", + "model.layers.82.mlp.up_proj.weight": "model-00125-of-00191.safetensors", + "model.layers.82.post_attention_layernorm.weight": "model-00126-of-00191.safetensors", + "model.layers.82.self_attn.k_proj.weight": "model-00124-of-00191.safetensors", + "model.layers.82.self_attn.o_proj.weight": "model-00124-of-00191.safetensors", + "model.layers.82.self_attn.q_proj.weight": "model-00124-of-00191.safetensors", + "model.layers.82.self_attn.v_proj.weight": "model-00124-of-00191.safetensors", + "model.layers.83.input_layernorm.weight": "model-00127-of-00191.safetensors", + "model.layers.83.mlp.down_proj.weight": "model-00127-of-00191.safetensors", + "model.layers.83.mlp.gate_proj.weight": "model-00126-of-00191.safetensors", + "model.layers.83.mlp.up_proj.weight": "model-00127-of-00191.safetensors", + "model.layers.83.post_attention_layernorm.weight": "model-00127-of-00191.safetensors", + "model.layers.83.self_attn.k_proj.weight": "model-00126-of-00191.safetensors", + "model.layers.83.self_attn.o_proj.weight": "model-00126-of-00191.safetensors", + "model.layers.83.self_attn.q_proj.weight": "model-00126-of-00191.safetensors", + "model.layers.83.self_attn.v_proj.weight": "model-00126-of-00191.safetensors", + "model.layers.84.input_layernorm.weight": "model-00129-of-00191.safetensors", + "model.layers.84.mlp.down_proj.weight": "model-00129-of-00191.safetensors", + "model.layers.84.mlp.gate_proj.weight": "model-00128-of-00191.safetensors", + "model.layers.84.mlp.up_proj.weight": "model-00128-of-00191.safetensors", + "model.layers.84.post_attention_layernorm.weight": "model-00129-of-00191.safetensors", + "model.layers.84.self_attn.k_proj.weight": "model-00127-of-00191.safetensors", + "model.layers.84.self_attn.o_proj.weight": "model-00127-of-00191.safetensors", + "model.layers.84.self_attn.q_proj.weight": "model-00127-of-00191.safetensors", + "model.layers.84.self_attn.v_proj.weight": "model-00127-of-00191.safetensors", + "model.layers.85.input_layernorm.weight": "model-00130-of-00191.safetensors", + "model.layers.85.mlp.down_proj.weight": "model-00130-of-00191.safetensors", + "model.layers.85.mlp.gate_proj.weight": "model-00129-of-00191.safetensors", + "model.layers.85.mlp.up_proj.weight": "model-00130-of-00191.safetensors", + "model.layers.85.post_attention_layernorm.weight": "model-00130-of-00191.safetensors", + "model.layers.85.self_attn.k_proj.weight": "model-00129-of-00191.safetensors", + "model.layers.85.self_attn.o_proj.weight": "model-00129-of-00191.safetensors", + "model.layers.85.self_attn.q_proj.weight": "model-00129-of-00191.safetensors", + "model.layers.85.self_attn.v_proj.weight": "model-00129-of-00191.safetensors", + "model.layers.86.input_layernorm.weight": "model-00132-of-00191.safetensors", + "model.layers.86.mlp.down_proj.weight": "model-00132-of-00191.safetensors", + "model.layers.86.mlp.gate_proj.weight": "model-00131-of-00191.safetensors", + "model.layers.86.mlp.up_proj.weight": "model-00131-of-00191.safetensors", + "model.layers.86.post_attention_layernorm.weight": "model-00132-of-00191.safetensors", + "model.layers.86.self_attn.k_proj.weight": "model-00130-of-00191.safetensors", + "model.layers.86.self_attn.o_proj.weight": "model-00130-of-00191.safetensors", + "model.layers.86.self_attn.q_proj.weight": "model-00130-of-00191.safetensors", + "model.layers.86.self_attn.v_proj.weight": "model-00130-of-00191.safetensors", + "model.layers.87.input_layernorm.weight": "model-00133-of-00191.safetensors", + "model.layers.87.mlp.down_proj.weight": "model-00133-of-00191.safetensors", + "model.layers.87.mlp.gate_proj.weight": "model-00132-of-00191.safetensors", + "model.layers.87.mlp.up_proj.weight": "model-00133-of-00191.safetensors", + "model.layers.87.post_attention_layernorm.weight": "model-00133-of-00191.safetensors", + "model.layers.87.self_attn.k_proj.weight": "model-00132-of-00191.safetensors", + "model.layers.87.self_attn.o_proj.weight": "model-00132-of-00191.safetensors", + "model.layers.87.self_attn.q_proj.weight": "model-00132-of-00191.safetensors", + "model.layers.87.self_attn.v_proj.weight": "model-00132-of-00191.safetensors", + "model.layers.88.input_layernorm.weight": "model-00135-of-00191.safetensors", + "model.layers.88.mlp.down_proj.weight": "model-00135-of-00191.safetensors", + "model.layers.88.mlp.gate_proj.weight": "model-00134-of-00191.safetensors", + "model.layers.88.mlp.up_proj.weight": "model-00134-of-00191.safetensors", + "model.layers.88.post_attention_layernorm.weight": "model-00135-of-00191.safetensors", + "model.layers.88.self_attn.k_proj.weight": "model-00133-of-00191.safetensors", + "model.layers.88.self_attn.o_proj.weight": "model-00133-of-00191.safetensors", + "model.layers.88.self_attn.q_proj.weight": "model-00133-of-00191.safetensors", + "model.layers.88.self_attn.v_proj.weight": "model-00133-of-00191.safetensors", + "model.layers.89.input_layernorm.weight": "model-00136-of-00191.safetensors", + "model.layers.89.mlp.down_proj.weight": "model-00136-of-00191.safetensors", + "model.layers.89.mlp.gate_proj.weight": "model-00135-of-00191.safetensors", + "model.layers.89.mlp.up_proj.weight": "model-00136-of-00191.safetensors", + "model.layers.89.post_attention_layernorm.weight": "model-00136-of-00191.safetensors", + "model.layers.89.self_attn.k_proj.weight": "model-00135-of-00191.safetensors", + "model.layers.89.self_attn.o_proj.weight": "model-00135-of-00191.safetensors", + "model.layers.89.self_attn.q_proj.weight": "model-00135-of-00191.safetensors", + "model.layers.89.self_attn.v_proj.weight": "model-00135-of-00191.safetensors", + "model.layers.9.input_layernorm.weight": "model-00016-of-00191.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00016-of-00191.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00015-of-00191.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00016-of-00191.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00016-of-00191.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00015-of-00191.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00015-of-00191.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00015-of-00191.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00015-of-00191.safetensors", + "model.layers.90.input_layernorm.weight": "model-00138-of-00191.safetensors", + "model.layers.90.mlp.down_proj.weight": "model-00138-of-00191.safetensors", + "model.layers.90.mlp.gate_proj.weight": "model-00137-of-00191.safetensors", + "model.layers.90.mlp.up_proj.weight": "model-00137-of-00191.safetensors", + "model.layers.90.post_attention_layernorm.weight": "model-00138-of-00191.safetensors", + "model.layers.90.self_attn.k_proj.weight": "model-00136-of-00191.safetensors", + "model.layers.90.self_attn.o_proj.weight": "model-00136-of-00191.safetensors", + "model.layers.90.self_attn.q_proj.weight": "model-00136-of-00191.safetensors", + "model.layers.90.self_attn.v_proj.weight": "model-00136-of-00191.safetensors", + "model.layers.91.input_layernorm.weight": "model-00139-of-00191.safetensors", + "model.layers.91.mlp.down_proj.weight": "model-00139-of-00191.safetensors", + "model.layers.91.mlp.gate_proj.weight": "model-00138-of-00191.safetensors", + "model.layers.91.mlp.up_proj.weight": "model-00139-of-00191.safetensors", + "model.layers.91.post_attention_layernorm.weight": "model-00139-of-00191.safetensors", + "model.layers.91.self_attn.k_proj.weight": "model-00138-of-00191.safetensors", + "model.layers.91.self_attn.o_proj.weight": "model-00138-of-00191.safetensors", + "model.layers.91.self_attn.q_proj.weight": "model-00138-of-00191.safetensors", + "model.layers.91.self_attn.v_proj.weight": "model-00138-of-00191.safetensors", + "model.layers.92.input_layernorm.weight": "model-00141-of-00191.safetensors", + "model.layers.92.mlp.down_proj.weight": "model-00141-of-00191.safetensors", + "model.layers.92.mlp.gate_proj.weight": "model-00140-of-00191.safetensors", + "model.layers.92.mlp.up_proj.weight": "model-00140-of-00191.safetensors", + "model.layers.92.post_attention_layernorm.weight": "model-00141-of-00191.safetensors", + "model.layers.92.self_attn.k_proj.weight": "model-00139-of-00191.safetensors", + "model.layers.92.self_attn.o_proj.weight": "model-00139-of-00191.safetensors", + "model.layers.92.self_attn.q_proj.weight": "model-00139-of-00191.safetensors", + "model.layers.92.self_attn.v_proj.weight": "model-00139-of-00191.safetensors", + "model.layers.93.input_layernorm.weight": "model-00142-of-00191.safetensors", + "model.layers.93.mlp.down_proj.weight": "model-00142-of-00191.safetensors", + "model.layers.93.mlp.gate_proj.weight": "model-00141-of-00191.safetensors", + "model.layers.93.mlp.up_proj.weight": "model-00142-of-00191.safetensors", + "model.layers.93.post_attention_layernorm.weight": "model-00142-of-00191.safetensors", + "model.layers.93.self_attn.k_proj.weight": "model-00141-of-00191.safetensors", + "model.layers.93.self_attn.o_proj.weight": "model-00141-of-00191.safetensors", + "model.layers.93.self_attn.q_proj.weight": "model-00141-of-00191.safetensors", + "model.layers.93.self_attn.v_proj.weight": "model-00141-of-00191.safetensors", + "model.layers.94.input_layernorm.weight": "model-00144-of-00191.safetensors", + "model.layers.94.mlp.down_proj.weight": "model-00144-of-00191.safetensors", + "model.layers.94.mlp.gate_proj.weight": "model-00143-of-00191.safetensors", + "model.layers.94.mlp.up_proj.weight": "model-00143-of-00191.safetensors", + "model.layers.94.post_attention_layernorm.weight": "model-00144-of-00191.safetensors", + "model.layers.94.self_attn.k_proj.weight": "model-00142-of-00191.safetensors", + "model.layers.94.self_attn.o_proj.weight": "model-00142-of-00191.safetensors", + "model.layers.94.self_attn.q_proj.weight": "model-00142-of-00191.safetensors", + "model.layers.94.self_attn.v_proj.weight": "model-00142-of-00191.safetensors", + "model.layers.95.input_layernorm.weight": "model-00145-of-00191.safetensors", + "model.layers.95.mlp.down_proj.weight": "model-00145-of-00191.safetensors", + "model.layers.95.mlp.gate_proj.weight": "model-00144-of-00191.safetensors", + "model.layers.95.mlp.up_proj.weight": "model-00145-of-00191.safetensors", + "model.layers.95.post_attention_layernorm.weight": "model-00145-of-00191.safetensors", + "model.layers.95.self_attn.k_proj.weight": "model-00144-of-00191.safetensors", + "model.layers.95.self_attn.o_proj.weight": "model-00144-of-00191.safetensors", + "model.layers.95.self_attn.q_proj.weight": "model-00144-of-00191.safetensors", + "model.layers.95.self_attn.v_proj.weight": "model-00144-of-00191.safetensors", + "model.layers.96.input_layernorm.weight": "model-00147-of-00191.safetensors", + "model.layers.96.mlp.down_proj.weight": "model-00147-of-00191.safetensors", + "model.layers.96.mlp.gate_proj.weight": "model-00146-of-00191.safetensors", + "model.layers.96.mlp.up_proj.weight": "model-00146-of-00191.safetensors", + "model.layers.96.post_attention_layernorm.weight": "model-00147-of-00191.safetensors", + "model.layers.96.self_attn.k_proj.weight": "model-00145-of-00191.safetensors", + "model.layers.96.self_attn.o_proj.weight": "model-00145-of-00191.safetensors", + "model.layers.96.self_attn.q_proj.weight": "model-00145-of-00191.safetensors", + "model.layers.96.self_attn.v_proj.weight": "model-00145-of-00191.safetensors", + "model.layers.97.input_layernorm.weight": "model-00148-of-00191.safetensors", + "model.layers.97.mlp.down_proj.weight": "model-00148-of-00191.safetensors", + "model.layers.97.mlp.gate_proj.weight": "model-00147-of-00191.safetensors", + "model.layers.97.mlp.up_proj.weight": "model-00148-of-00191.safetensors", + "model.layers.97.post_attention_layernorm.weight": "model-00148-of-00191.safetensors", + "model.layers.97.self_attn.k_proj.weight": "model-00147-of-00191.safetensors", + "model.layers.97.self_attn.o_proj.weight": "model-00147-of-00191.safetensors", + "model.layers.97.self_attn.q_proj.weight": "model-00147-of-00191.safetensors", + "model.layers.97.self_attn.v_proj.weight": "model-00147-of-00191.safetensors", + "model.layers.98.input_layernorm.weight": "model-00150-of-00191.safetensors", + "model.layers.98.mlp.down_proj.weight": "model-00150-of-00191.safetensors", + "model.layers.98.mlp.gate_proj.weight": "model-00149-of-00191.safetensors", + "model.layers.98.mlp.up_proj.weight": "model-00149-of-00191.safetensors", + "model.layers.98.post_attention_layernorm.weight": "model-00150-of-00191.safetensors", + "model.layers.98.self_attn.k_proj.weight": "model-00148-of-00191.safetensors", + "model.layers.98.self_attn.o_proj.weight": "model-00148-of-00191.safetensors", + "model.layers.98.self_attn.q_proj.weight": "model-00148-of-00191.safetensors", + "model.layers.98.self_attn.v_proj.weight": "model-00148-of-00191.safetensors", + "model.layers.99.input_layernorm.weight": "model-00151-of-00191.safetensors", + "model.layers.99.mlp.down_proj.weight": "model-00151-of-00191.safetensors", + "model.layers.99.mlp.gate_proj.weight": "model-00150-of-00191.safetensors", + "model.layers.99.mlp.up_proj.weight": "model-00151-of-00191.safetensors", + "model.layers.99.post_attention_layernorm.weight": "model-00151-of-00191.safetensors", + "model.layers.99.self_attn.k_proj.weight": "model-00150-of-00191.safetensors", + "model.layers.99.self_attn.o_proj.weight": "model-00150-of-00191.safetensors", + "model.layers.99.self_attn.q_proj.weight": "model-00150-of-00191.safetensors", + "model.layers.99.self_attn.v_proj.weight": "model-00150-of-00191.safetensors", + "model.norm.weight": "model-00190-of-00191.safetensors" + } +} diff --git a/tokenizer_config.json b/tokenizer_config.json index 0c5aa98e634b25ace0dcab50795241dc159b00c5..ef8218534a4cd20717275b6ae849b35d4821ba1d 100644 --- a/tokenizer_config.json +++ b/tokenizer_config.json @@ -2061,6 +2061,7 @@ "chat_template": "{% for message in messages %}{% if message['role'] == 'system' %}{{ '<|system|>\n' + message['content'] + '\n' }}{% elif message['role'] == 'user' %}{{ '<|user|>\n' + message['content'] + '\n' }}{% elif message['role'] == 'assistant' %}{% if not loop.last %}{{ '<|assistant|>\n' + message['content'] + eos_token + '\n' }}{% else %}{{ '<|assistant|>\n' + message['content'] + eos_token }}{% endif %}{% endif %}{% if loop.last and add_generation_prompt %}{{ '<|assistant|>\n' }}{% endif %}{% endfor %}", "clean_up_tokenization_spaces": true, "eos_token": "<|end_of_text|>", + "extra_special_tokens": {}, "model_input_names": [ "input_ids", "attention_mask"