diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..222b1665094fd01d39a1817ac2cc5973efa55eff --- /dev/null +++ b/config.json @@ -0,0 +1 @@ +{"architectures": ["LLaMAForCausalLM"], "bos_token_id": 0, "eos_token_id": 1, "hidden_act": "silu", "hidden_size": 8192, "intermediate_size": 22016, "initializer_range": 0.02, "max_sequence_length": 2048, "model_type": "llama", "num_attention_heads": 64, "num_hidden_layers": 80, "pad_token_id": -1, "rms_norm_eps": 1e-05, "torch_dtype": "float16", "transformers_version": "4.27.0.dev0", "use_cache": true, "vocab_size": 32000} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..8fdfba7b10dbe7d959d961b28f9e67433c0c0e9c --- /dev/null +++ b/generation_config.json @@ -0,0 +1 @@ +{"_from_model_config": true, "bos_token_id": 0, "eos_token_id": 1, "pad_token_id": -1, "transformers_version": "4.27.0.dev0"} \ No newline at end of file diff --git a/pytorch_model-00000-of-00081.bin b/pytorch_model-00000-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e4ce66e7713e87c98e5c2737ee2927b148463b8 --- /dev/null +++ b/pytorch_model-00000-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68fc9bee12edadf7b7ac8aab6d2a37cb0d77cf1e545e7347afde02b2d50ea9bb +size 1619038147 diff --git a/pytorch_model-00001-of-00081.bin b/pytorch_model-00001-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..5a6de4b47dfb825d0f7ca137ed6d9a29590cd6c4 --- /dev/null +++ b/pytorch_model-00001-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4424704779d18cd4aa2c40a97240a7cec1cfd111f8cb5295f387394c55b988 +size 1619038147 diff --git a/pytorch_model-00002-of-00081.bin b/pytorch_model-00002-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..76408c06b87eb3f4f0bea678d06b37b4d7163352 --- /dev/null +++ b/pytorch_model-00002-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:992226e23e5792a94db58cba6e71e7b622519028cf9789a82fdd96b8ea65367d +size 1619038147 diff --git a/pytorch_model-00003-of-00081.bin b/pytorch_model-00003-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..3347802c68fc4e6ba335e8fe1afc2d069fd5a29d --- /dev/null +++ b/pytorch_model-00003-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f704b112af33c646dc15196c5c48b8e30b4eb16e9fe7e0f4f7d8893c8cfac5ad +size 1619038147 diff --git a/pytorch_model-00004-of-00081.bin b/pytorch_model-00004-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..84a441407053228be00bfc7bc031fd0a3ddbc915 --- /dev/null +++ b/pytorch_model-00004-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb6f48fca191dd96eb4f4799035e703d2c3763a4792245f84ffaf23f56223bca +size 1619038147 diff --git a/pytorch_model-00005-of-00081.bin b/pytorch_model-00005-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..61a958b1cee96c65b36029cad212a0fd1c829a1e --- /dev/null +++ b/pytorch_model-00005-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbde79ae57c5739c2937feca6b27ad266256648cd916ad99098a5f815ad95721 +size 1619038147 diff --git a/pytorch_model-00006-of-00081.bin b/pytorch_model-00006-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..00f989b7c8302e0092f6d681b39dba925f48f4b7 --- /dev/null +++ b/pytorch_model-00006-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3132d5a3fdfcb27c63f11cd80bd9c481ed374d86ca308704e2bb3f9b2f230f09 +size 1619038147 diff --git a/pytorch_model-00007-of-00081.bin b/pytorch_model-00007-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..005e292c59482dc9ae79325f18683437f7641d0e --- /dev/null +++ b/pytorch_model-00007-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e419fd164c2b87137f3e12dc2eebcab223a840a2fa2d87fd50a9950533889b +size 1619038147 diff --git a/pytorch_model-00008-of-00081.bin b/pytorch_model-00008-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..44c154b8ffb8bd38a7f7ab2de4ce93cc29cbbe6e --- /dev/null +++ b/pytorch_model-00008-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:626b5c8d2c77dece91751cbe1ff3e8388485524fdbd4602835260efea1e04aae +size 1619038147 diff --git a/pytorch_model-00009-of-00081.bin b/pytorch_model-00009-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..e49b85e368055114944b48de4c63cd1454ff0768 --- /dev/null +++ b/pytorch_model-00009-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc39d6390f7b54f3d21230d51c98ed2155666f9486e236800e0392447342dd96 +size 1619038147 diff --git a/pytorch_model-00010-of-00081.bin b/pytorch_model-00010-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8fac9b1df506eb38726906c4e3693f9982524ac --- /dev/null +++ b/pytorch_model-00010-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfba454a7511bb30131557eb95e6ddd47bc7769d11c93ccb29e2750694d37eed +size 1619038147 diff --git a/pytorch_model-00011-of-00081.bin b/pytorch_model-00011-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..539005343034258035972c4da83a55fc68d03846 --- /dev/null +++ b/pytorch_model-00011-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8611ed94ebd5a257c9c5b5ce4e450a234064b21ff2aa327e1eef84c94bb22bc +size 1619038147 diff --git a/pytorch_model-00012-of-00081.bin b/pytorch_model-00012-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..d04236745f07b356b4fa46b59dffea15f4ca169e --- /dev/null +++ b/pytorch_model-00012-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bc0c7a90367231e1618be75dc8f454c653b8d6fee7bcae7eabf92a5d5ad5df1 +size 1619038147 diff --git a/pytorch_model-00013-of-00081.bin b/pytorch_model-00013-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..c0ec3ec9577551e886ab34b78fbe2916578e69e4 --- /dev/null +++ b/pytorch_model-00013-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb0b4c04217eac3b80e7ee7811f96926ddfdbe0dc7bebf319c352c29889b4b40 +size 1619038147 diff --git a/pytorch_model-00014-of-00081.bin b/pytorch_model-00014-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..ec6c798829158ba21fec45824dab1e7b8b173acc --- /dev/null +++ b/pytorch_model-00014-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:682f19ad023ec912264ec688b209670639b11e7e4c919bbe868a7edf1fb21e3d +size 1619038147 diff --git a/pytorch_model-00015-of-00081.bin b/pytorch_model-00015-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..797e9d7dfdf5430adcd473f2c307ac18842cc865 --- /dev/null +++ b/pytorch_model-00015-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a39a09887541df6c46dd500a764bbaaceb099da95170466f46506d9b6a21ad98 +size 1619038147 diff --git a/pytorch_model-00016-of-00081.bin b/pytorch_model-00016-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..d6761cc9ccf492c87f8e6160b292feb5def4dae1 --- /dev/null +++ b/pytorch_model-00016-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e4e1a7c89b8fe451b1352161210f54a9547a3be12183ce77686ffb2d0278db +size 1619038147 diff --git a/pytorch_model-00017-of-00081.bin b/pytorch_model-00017-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..b864b235bec7c168b4f003e5f13524bde8c3b314 --- /dev/null +++ b/pytorch_model-00017-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a98c8c083366566a6acf1b147db47f876cec8bf7af54ea2d38f55e3225c31527 +size 1619038147 diff --git a/pytorch_model-00018-of-00081.bin b/pytorch_model-00018-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..22ef10efbf1ee68f1e8115b5d9f9ae276d8b72b0 --- /dev/null +++ b/pytorch_model-00018-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c589361d5bef9b0f337b629ea8179a91be78a6710a9217deb0299eed9b0c8a +size 1619038147 diff --git a/pytorch_model-00019-of-00081.bin b/pytorch_model-00019-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..ec5f062cc78245c6c8bce1b144b6597f1dfe8860 --- /dev/null +++ b/pytorch_model-00019-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a7ad8a72f3b8f1cc872da92dbdfffbce854d919ade3af21d86c212bbb2077b1 +size 1619038147 diff --git a/pytorch_model-00020-of-00081.bin b/pytorch_model-00020-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..61707f87137bc58eec529043a9dbb0a95ccf57fa --- /dev/null +++ b/pytorch_model-00020-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a52100d1bd5049cdbf0a9d8bdde2c42f23f3aca1e2126ded2eaf043de195d0c4 +size 1619038147 diff --git a/pytorch_model-00021-of-00081.bin b/pytorch_model-00021-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..9446339106f1f1fe5b1dd9a63e8dbad952d3029e --- /dev/null +++ b/pytorch_model-00021-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c14af88aa227e58a295c4971a2bb466b8d1d3917970c3c0eb4739879d35014ed +size 1619038147 diff --git a/pytorch_model-00022-of-00081.bin b/pytorch_model-00022-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..fed86773e528b48b2036e96fd4f50a532d2c4455 --- /dev/null +++ b/pytorch_model-00022-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd6e0952402bb0ec361222904a8457ab00a922a24c37407a2ef5104a5f3cc34a +size 1619038147 diff --git a/pytorch_model-00023-of-00081.bin b/pytorch_model-00023-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..e9a2dfe0ccad772c93b559a982ce6c589bbdf44f --- /dev/null +++ b/pytorch_model-00023-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb4927a000c9a736cb75f615253d12380ce22f7b5ef5eb19f8e5782f8083156 +size 1619038147 diff --git a/pytorch_model-00024-of-00081.bin b/pytorch_model-00024-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..7becefd945f88a7503de8bee34d01ac09767c6c7 --- /dev/null +++ b/pytorch_model-00024-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04c4183304a5bc53238db2d3ded505fa228aca0f5fa75f3b5ac6b58b76687531 +size 1619038147 diff --git a/pytorch_model-00025-of-00081.bin b/pytorch_model-00025-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..a833523f5e8fa9fd8264550fe183e61504dfdb2e --- /dev/null +++ b/pytorch_model-00025-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e350c5fc7c8107f1ad0da1e844744ae7fa6eec2e9a13db29867c04abbfcf8edf +size 1619038147 diff --git a/pytorch_model-00026-of-00081.bin b/pytorch_model-00026-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc75eb0b42ff8950dd3add95ea71c692b28cb9f9 --- /dev/null +++ b/pytorch_model-00026-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49021681467370427b77be8ef7a1a902afbcdb64eec5d13091441cb135abba72 +size 1619038147 diff --git a/pytorch_model-00027-of-00081.bin b/pytorch_model-00027-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a8237814ee05bb647bf3055651273e1a4626d53 --- /dev/null +++ b/pytorch_model-00027-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:309c323b85fddfcdc60991c80bea10744bdc689d6cdae35fd01a633b1f8f2ce5 +size 1619038147 diff --git a/pytorch_model-00028-of-00081.bin b/pytorch_model-00028-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..90fbb74687c646ca1e674914855fc20b29f49415 --- /dev/null +++ b/pytorch_model-00028-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58d3ff03fe53a3d536ab148f09df6d3746a09f2faefcb9450dcac14a092f3c57 +size 1619038147 diff --git a/pytorch_model-00029-of-00081.bin b/pytorch_model-00029-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..a0afb45ca9924982dfae39db8b8e283471bda2ea --- /dev/null +++ b/pytorch_model-00029-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf1da9d5389ef1082a7dd97a297aac9a06e53855c1d92dd86fc2736882c412a1 +size 1619038147 diff --git a/pytorch_model-00030-of-00081.bin b/pytorch_model-00030-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a0b77a20580e8f463a32ddfa266697cb2e4f69b --- /dev/null +++ b/pytorch_model-00030-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8171f0190f587552dfe90439504bceb73dbf8dbe4f310cfbf03b6a01293324a4 +size 1619038147 diff --git a/pytorch_model-00031-of-00081.bin b/pytorch_model-00031-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..64727d44ac3d6810068d1328debe71cf59cc48c6 --- /dev/null +++ b/pytorch_model-00031-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02465f86597d7a946d8808a6e050b7a8145a3965075069d63c4c021120d526f6 +size 1619038147 diff --git a/pytorch_model-00032-of-00081.bin b/pytorch_model-00032-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..1efaccf775935ef8e2a6ef08a8ee2f642399127d --- /dev/null +++ b/pytorch_model-00032-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb5d84bf672bd0ce80b705e4021153fd1d1560c277c06e7047d97feb95e83dc +size 1619038147 diff --git a/pytorch_model-00033-of-00081.bin b/pytorch_model-00033-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..31a277196cb986c836871fc76101cde8dd53a89a --- /dev/null +++ b/pytorch_model-00033-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8459f18ee7039d110e36e28c1db1fb589795a7e1c92c09d507cb3c5cea4cd29 +size 1619038147 diff --git a/pytorch_model-00034-of-00081.bin b/pytorch_model-00034-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..a0f034b76de5fc1d02deb72b61356b1534037cf5 --- /dev/null +++ b/pytorch_model-00034-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7adb382c4fa1c39633a9d59761deca71a9ef27ffbb0172aeadc4c6edcdbf0c66 +size 1619038147 diff --git a/pytorch_model-00035-of-00081.bin b/pytorch_model-00035-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..33bc848e5221890d8ab3f5fb58d7155fd5546c75 --- /dev/null +++ b/pytorch_model-00035-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f8ec0a0aa8fcbe93e09db51cc8de7cfa37d57f024c918dad03155d0a406128 +size 1619038147 diff --git a/pytorch_model-00036-of-00081.bin b/pytorch_model-00036-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..14beee5216421155a5a6cc22cedfcc622a17e755 --- /dev/null +++ b/pytorch_model-00036-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429a37e53ca2e25b777c9a9a4c14094673199be16b750c8ebb3cb30640d9fde5 +size 1619038147 diff --git a/pytorch_model-00037-of-00081.bin b/pytorch_model-00037-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..8acc78548f2775623461c9ea16a5ef6f65f58b5d --- /dev/null +++ b/pytorch_model-00037-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6d9288ab246f6f98930255116de2ff7ce3adb5f80112b6628f577b7dfd2407b +size 1619038147 diff --git a/pytorch_model-00038-of-00081.bin b/pytorch_model-00038-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..e84900469a538f9d1e033b48af630b4873ad23da --- /dev/null +++ b/pytorch_model-00038-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80e49eb3c0a4fd8ad099b66c191eead9caeebb6f46cad5cbee49e6c9fc4efbef +size 1619038147 diff --git a/pytorch_model-00039-of-00081.bin b/pytorch_model-00039-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..e061e801250be8288d4db759116231ca8ef79be1 --- /dev/null +++ b/pytorch_model-00039-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df25b5d3dbc283e8ef06b457e3c13e780ee1677e811b92defa5994dc30ec094a +size 1619038147 diff --git a/pytorch_model-00040-of-00081.bin b/pytorch_model-00040-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a6216c8fd8516fb45daf35f0aba1b128c0d5904 --- /dev/null +++ b/pytorch_model-00040-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc993d38a3af7257edb1709d828558d3f5431d430e2f1c0351f06423db5649f6 +size 1619038147 diff --git a/pytorch_model-00041-of-00081.bin b/pytorch_model-00041-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..651a5577e075c4fafa2e22670cb2b45f6be96b8d --- /dev/null +++ b/pytorch_model-00041-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc28c1b015b820ef9c340bdd2d45ca4e944dd7919938181aeee33aa2df9a79d +size 1619038147 diff --git a/pytorch_model-00042-of-00081.bin b/pytorch_model-00042-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..415b0e1786734edf605fa3ff41968ea51db37c24 --- /dev/null +++ b/pytorch_model-00042-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464c757272ed68f90ba93eb56f2f98f9959ac8873f563f16182d80e5d600a285 +size 1619038147 diff --git a/pytorch_model-00043-of-00081.bin b/pytorch_model-00043-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5fc0d95efe479330c3b0ceab5ffc341e7be18f6 --- /dev/null +++ b/pytorch_model-00043-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d0731f1d9ce877043be1bd71563b589fef9d138f5bb8e8236f57a14ecc0dad7 +size 1619038147 diff --git a/pytorch_model-00044-of-00081.bin b/pytorch_model-00044-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..f4cf98e69746f5047e28d92ab21ba23818fea691 --- /dev/null +++ b/pytorch_model-00044-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27726dab9b8722223a8aad87a77e8e9385e5ea35d4d7bafffb6c49e6f650c97 +size 1619038147 diff --git a/pytorch_model-00045-of-00081.bin b/pytorch_model-00045-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d44bd38abfb67af5da9aa7f7934c20f2d857129 --- /dev/null +++ b/pytorch_model-00045-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:576e74192d1acbcb76fac8c591f91e497197f34ee5077c25bfb6d8db5e2b8587 +size 1619038147 diff --git a/pytorch_model-00046-of-00081.bin b/pytorch_model-00046-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c16007adf5627b6a71ba952d9d8f9eb0402f447 --- /dev/null +++ b/pytorch_model-00046-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7eb7eb735582b9e82fdcc8b3db69e46539833d398bee37db1ec9e9b1de3ad8 +size 1619038147 diff --git a/pytorch_model-00047-of-00081.bin b/pytorch_model-00047-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..92858d34fc9fbab0d35d697a6e02d5c0255b205c --- /dev/null +++ b/pytorch_model-00047-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0738e7958db6213f37b0d3d33df44999540407170267d9f2e5c3e1d80d8bdf65 +size 1619038147 diff --git a/pytorch_model-00048-of-00081.bin b/pytorch_model-00048-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a77984713a776ea26c6a211b515f769ebae8cd9 --- /dev/null +++ b/pytorch_model-00048-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea4359d5a1873f95fbf55c8759e8dc3c7bf335c92b3c6310db426732df7e39b1 +size 1619038147 diff --git a/pytorch_model-00049-of-00081.bin b/pytorch_model-00049-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..79fab86ab0354ac769ede9c6df57edff6b01236a --- /dev/null +++ b/pytorch_model-00049-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:320b5c20a0c66b40c0777792187366144a3bb93a670776021fdcb7e79905f90b +size 1619038147 diff --git a/pytorch_model-00050-of-00081.bin b/pytorch_model-00050-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..1737e227e2a3ba89bdcfd705bd45b947a0e4d9a0 --- /dev/null +++ b/pytorch_model-00050-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd58259451287c91a533fd5e320abcf7ff3c47f81da3beb032e859fabcef0728 +size 1619038147 diff --git a/pytorch_model-00051-of-00081.bin b/pytorch_model-00051-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..2612e7f4b901cf0b0a94b8199dd50a338bb7b24f --- /dev/null +++ b/pytorch_model-00051-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e038c831e849d6a6d32f2f17f5cc720081de2007fe48330ea2fd31f5ca7e15ec +size 1619038147 diff --git a/pytorch_model-00052-of-00081.bin b/pytorch_model-00052-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..529ce21b21acd40203c8affe176bf65178db5c07 --- /dev/null +++ b/pytorch_model-00052-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45e1753a797f10a205a8ad3a03f6e9b0a402a996b0afa9c318bf8bf182e1ed59 +size 1619038147 diff --git a/pytorch_model-00053-of-00081.bin b/pytorch_model-00053-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..c77caa03896c9efafefc0b47ef54bc00d693ac58 --- /dev/null +++ b/pytorch_model-00053-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1763274615daebbd5679e3a80bff1bbc03a7cce7a66e61843d66c00b1e8644f6 +size 1619038147 diff --git a/pytorch_model-00054-of-00081.bin b/pytorch_model-00054-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..084a364599f052f5e7c92c20aa3e628004d0c2ce --- /dev/null +++ b/pytorch_model-00054-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbc43a7d018d4bd89d5ccfa72c657a6aee0d048bd44b5329bb2525fe73b94d5a +size 1619038147 diff --git a/pytorch_model-00055-of-00081.bin b/pytorch_model-00055-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..bf6dc8e226388c4a747652fee8963c24688223fd --- /dev/null +++ b/pytorch_model-00055-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:848a9720924472c01fa76e1de9e491dfdc47fd97f8779284c976b3339772b248 +size 1619038147 diff --git a/pytorch_model-00056-of-00081.bin b/pytorch_model-00056-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..dcc8cab2afbecba37a3976a5d122238dc5d3bc0d --- /dev/null +++ b/pytorch_model-00056-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7f2e20d579cf836d2196d6440c4d9f69671a80ecb7aa0a89f4086b7926232f8 +size 1619038147 diff --git a/pytorch_model-00057-of-00081.bin b/pytorch_model-00057-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..30ca95ff5dfede3a06383d2567b5c2f126b377c6 --- /dev/null +++ b/pytorch_model-00057-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39bdb13878d1a6be1b1f6483a406dabd9ec00c811edb431bb7f47f00fdc27579 +size 1619038147 diff --git a/pytorch_model-00058-of-00081.bin b/pytorch_model-00058-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..f5fa3c2f3f5c7663438042ac8b8a611aba89ce7b --- /dev/null +++ b/pytorch_model-00058-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac63eb9ab45ad3a3fcdc11164caded92fd5adb5c1fd21c1b6f591bf06d6206d +size 1619038147 diff --git a/pytorch_model-00059-of-00081.bin b/pytorch_model-00059-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..c00da65c35557c31b33bce7ea4024b148a0b901b --- /dev/null +++ b/pytorch_model-00059-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:227c1cc1986fd1d783cfe106d60e79adda2d0d814bc8cf3cb97ebfed1bc8b9bb +size 1619038147 diff --git a/pytorch_model-00060-of-00081.bin b/pytorch_model-00060-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..09b7441ee92f865d6c546c2e37287f6f90a2d71b --- /dev/null +++ b/pytorch_model-00060-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc57c5aba30adaf3b603be81fa86aca28c92e7f7984d455e1c0f69bb65c22be4 +size 1619038147 diff --git a/pytorch_model-00061-of-00081.bin b/pytorch_model-00061-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..944d2eb89375819c49a315b98478aba5b1298a7a --- /dev/null +++ b/pytorch_model-00061-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50f752d906540e6cdca0082abdb7a1c089f9710d70e1ee832ab33ed0d2c1c4e0 +size 1619038147 diff --git a/pytorch_model-00062-of-00081.bin b/pytorch_model-00062-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..77f91c32d116617cc0fd4337dc1a34ebf1f16bc7 --- /dev/null +++ b/pytorch_model-00062-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f38c3c3ecef40fc2f9492a6563181786acc668079df0c11e4678fa3267c7192 +size 1619038147 diff --git a/pytorch_model-00063-of-00081.bin b/pytorch_model-00063-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..5276bd8d8d12611302c4b3d8fad7f3ef4dd73ebc --- /dev/null +++ b/pytorch_model-00063-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdde4ff4923f7d00c4dd9a9834e1df22c45d7f2a750bf2d12fd477f872f23be6 +size 1619038147 diff --git a/pytorch_model-00064-of-00081.bin b/pytorch_model-00064-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..7ef13cf9f4aef18a64df12c776362b491a54103e --- /dev/null +++ b/pytorch_model-00064-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c684410bfa6a4c459bdbe5042b8a4039705aa7392d467acdcc958966161c4418 +size 1619038147 diff --git a/pytorch_model-00065-of-00081.bin b/pytorch_model-00065-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..af5f4de6e576f53551f47b6c48036ed248e9c885 --- /dev/null +++ b/pytorch_model-00065-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af069a5fadd085784f2796865fe50a04b8479453c91411a24f9c589b6d7eec15 +size 1619038147 diff --git a/pytorch_model-00066-of-00081.bin b/pytorch_model-00066-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..288697db9da63d0d44b7fe4cfcf55d197fae2b29 --- /dev/null +++ b/pytorch_model-00066-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e00e3c4b6a7287fd8054dbddce269d5cbf74a4bc80c037b58fc2d869120b8cc5 +size 1619038147 diff --git a/pytorch_model-00067-of-00081.bin b/pytorch_model-00067-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..fda71a40c474765e46a58ddc4ddeef15b0e262e0 --- /dev/null +++ b/pytorch_model-00067-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef50f4869fe4e38389bf3dffd3f18a26cf7105ba8e31617b4143d60e6e9742fc +size 1619038147 diff --git a/pytorch_model-00068-of-00081.bin b/pytorch_model-00068-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..0512ce2ed778c0aa1cd09166501da1d5d9c18ef4 --- /dev/null +++ b/pytorch_model-00068-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60512d0e307de19719d1966881f249d6a323821d535f6348c57b6e82a33bed29 +size 1619038147 diff --git a/pytorch_model-00069-of-00081.bin b/pytorch_model-00069-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..fb80d247aa9ceafc7771469a3ce4d0cff818316a --- /dev/null +++ b/pytorch_model-00069-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fe14358bc73324dd854a4f0c9b9737745dd164501f2b0170c552650f1ecffeb +size 1619038147 diff --git a/pytorch_model-00070-of-00081.bin b/pytorch_model-00070-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..a68275a46704356f13a72d89e408c02047e32774 --- /dev/null +++ b/pytorch_model-00070-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133d33ce71c691bd24343a7553af44b54188065a26b134ffc36d445144ade701 +size 1619038147 diff --git a/pytorch_model-00071-of-00081.bin b/pytorch_model-00071-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..1e0e31391a0799c035ab97c78495956a43f01ed0 --- /dev/null +++ b/pytorch_model-00071-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f329a817a860a63ce413db93f2bcd56778db7daea84e835dccabb7e6135a05 +size 1619038147 diff --git a/pytorch_model-00072-of-00081.bin b/pytorch_model-00072-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..9b021019bedb03c85c1164f4be24c3942dcaea28 --- /dev/null +++ b/pytorch_model-00072-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:832743355615bb2b10efb73e055dab8e582c4741a75c6130eea798e5074d8463 +size 1619038147 diff --git a/pytorch_model-00073-of-00081.bin b/pytorch_model-00073-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..e59e0a2abc178af59a7821901037129e0116aa99 --- /dev/null +++ b/pytorch_model-00073-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:193088cf36dfd3baf803b10274f020366ecc14892c1602c412be119e3576ee1f +size 1619038147 diff --git a/pytorch_model-00074-of-00081.bin b/pytorch_model-00074-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6985381938f7c299a0456967484b6cd9fc64c18 --- /dev/null +++ b/pytorch_model-00074-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d0c9599bbcad80c79dc6088d20a6d706ef53dbfd7b3fc7f8c7eab71cd8da1d5 +size 1619038147 diff --git a/pytorch_model-00075-of-00081.bin b/pytorch_model-00075-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..980620b2c8f53d4a518a86f0ff76e256fdd4caee --- /dev/null +++ b/pytorch_model-00075-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21a1b9a77bb29e89869ddfd34fc8c1ec347c997cca91a057ca5aeb23acbbdc8 +size 1619038147 diff --git a/pytorch_model-00076-of-00081.bin b/pytorch_model-00076-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..00ce42916b43433de10a0bd181a58e61240a6bd0 --- /dev/null +++ b/pytorch_model-00076-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc0ce23c2a9f208c97c0ca806d23b2d839eed2f05b01017f0ce3015e0c98d92f +size 1619038147 diff --git a/pytorch_model-00077-of-00081.bin b/pytorch_model-00077-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..2bc961cd227626f9e6afcc3855460b7cd5e7b4c1 --- /dev/null +++ b/pytorch_model-00077-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8927b6115a8420ec978cad717483430d37b57dc8aa253109b6c3f533072127d5 +size 1619038147 diff --git a/pytorch_model-00078-of-00081.bin b/pytorch_model-00078-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..8a7f346e6626ca897da65c6066899b2514ffefa9 --- /dev/null +++ b/pytorch_model-00078-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbde7755b19511eed20ba5cac81f56e1d8194c9ae8ffc5720b36004e8a2fd33b +size 1619038147 diff --git a/pytorch_model-00079-of-00081.bin b/pytorch_model-00079-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..84286ab6dd73cf745200c78432c7ed87c7ddac74 --- /dev/null +++ b/pytorch_model-00079-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928347e3feebacf07d8d69a7a5ce7e0f35aacbfa8c05aa8458ce129a87c3866e +size 1619038147 diff --git a/pytorch_model-00080-of-00081.bin b/pytorch_model-00080-of-00081.bin new file mode 100644 index 0000000000000000000000000000000000000000..4bba52fd02501cb269eb8cb8cc80ee720bfad7d9 --- /dev/null +++ b/pytorch_model-00080-of-00081.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:490e45ab89817a82477f9d25713159d84f26ea3c8a3eaf5da60ecda0551cd425 +size 1048593868 diff --git a/pytorch_model.bin.index.json b/pytorch_model.bin.index.json new file mode 100644 index 0000000000000000000000000000000000000000..ffc6353d6744dbd90c3e72284e2c2284dfaa9a87 --- /dev/null +++ b/pytorch_model.bin.index.json @@ -0,0 +1 @@ +{"weight_map": {"model.layers.0.input_layernorm.weight": "pytorch_model-00000-of-00081.bin", "model.layers.0.post_attention_layernorm.weight": "pytorch_model-00000-of-00081.bin", "model.layers.0.self_attn.q_proj.weight": "pytorch_model-00000-of-00081.bin", "model.layers.0.self_attn.k_proj.weight": "pytorch_model-00000-of-00081.bin", "model.layers.0.self_attn.v_proj.weight": "pytorch_model-00000-of-00081.bin", "model.layers.0.self_attn.o_proj.weight": "pytorch_model-00000-of-00081.bin", "model.layers.0.mlp.gate_proj.weight": "pytorch_model-00000-of-00081.bin", "model.layers.0.mlp.down_proj.weight": "pytorch_model-00000-of-00081.bin", "model.layers.0.mlp.up_proj.weight": "pytorch_model-00000-of-00081.bin", "model.layers.0.self_attn.rotary_emb.inv_freq": "pytorch_model-00000-of-00081.bin", "model.layers.1.input_layernorm.weight": "pytorch_model-00001-of-00081.bin", "model.layers.1.post_attention_layernorm.weight": "pytorch_model-00001-of-00081.bin", "model.layers.1.self_attn.q_proj.weight": "pytorch_model-00001-of-00081.bin", "model.layers.1.self_attn.k_proj.weight": "pytorch_model-00001-of-00081.bin", "model.layers.1.self_attn.v_proj.weight": "pytorch_model-00001-of-00081.bin", "model.layers.1.self_attn.o_proj.weight": "pytorch_model-00001-of-00081.bin", "model.layers.1.mlp.gate_proj.weight": "pytorch_model-00001-of-00081.bin", "model.layers.1.mlp.down_proj.weight": "pytorch_model-00001-of-00081.bin", "model.layers.1.mlp.up_proj.weight": "pytorch_model-00001-of-00081.bin", "model.layers.1.self_attn.rotary_emb.inv_freq": "pytorch_model-00001-of-00081.bin", "model.layers.2.input_layernorm.weight": "pytorch_model-00002-of-00081.bin", "model.layers.2.post_attention_layernorm.weight": "pytorch_model-00002-of-00081.bin", "model.layers.2.self_attn.q_proj.weight": "pytorch_model-00002-of-00081.bin", "model.layers.2.self_attn.k_proj.weight": "pytorch_model-00002-of-00081.bin", "model.layers.2.self_attn.v_proj.weight": "pytorch_model-00002-of-00081.bin", "model.layers.2.self_attn.o_proj.weight": "pytorch_model-00002-of-00081.bin", "model.layers.2.mlp.gate_proj.weight": "pytorch_model-00002-of-00081.bin", "model.layers.2.mlp.down_proj.weight": "pytorch_model-00002-of-00081.bin", "model.layers.2.mlp.up_proj.weight": "pytorch_model-00002-of-00081.bin", "model.layers.2.self_attn.rotary_emb.inv_freq": "pytorch_model-00002-of-00081.bin", "model.layers.3.input_layernorm.weight": "pytorch_model-00003-of-00081.bin", "model.layers.3.post_attention_layernorm.weight": "pytorch_model-00003-of-00081.bin", "model.layers.3.self_attn.q_proj.weight": "pytorch_model-00003-of-00081.bin", "model.layers.3.self_attn.k_proj.weight": "pytorch_model-00003-of-00081.bin", "model.layers.3.self_attn.v_proj.weight": "pytorch_model-00003-of-00081.bin", "model.layers.3.self_attn.o_proj.weight": "pytorch_model-00003-of-00081.bin", "model.layers.3.mlp.gate_proj.weight": "pytorch_model-00003-of-00081.bin", "model.layers.3.mlp.down_proj.weight": "pytorch_model-00003-of-00081.bin", "model.layers.3.mlp.up_proj.weight": "pytorch_model-00003-of-00081.bin", "model.layers.3.self_attn.rotary_emb.inv_freq": "pytorch_model-00003-of-00081.bin", "model.layers.4.input_layernorm.weight": "pytorch_model-00004-of-00081.bin", "model.layers.4.post_attention_layernorm.weight": "pytorch_model-00004-of-00081.bin", "model.layers.4.self_attn.q_proj.weight": "pytorch_model-00004-of-00081.bin", "model.layers.4.self_attn.k_proj.weight": "pytorch_model-00004-of-00081.bin", "model.layers.4.self_attn.v_proj.weight": "pytorch_model-00004-of-00081.bin", "model.layers.4.self_attn.o_proj.weight": "pytorch_model-00004-of-00081.bin", "model.layers.4.mlp.gate_proj.weight": "pytorch_model-00004-of-00081.bin", "model.layers.4.mlp.down_proj.weight": "pytorch_model-00004-of-00081.bin", "model.layers.4.mlp.up_proj.weight": "pytorch_model-00004-of-00081.bin", "model.layers.4.self_attn.rotary_emb.inv_freq": "pytorch_model-00004-of-00081.bin", "model.layers.5.input_layernorm.weight": "pytorch_model-00005-of-00081.bin", "model.layers.5.post_attention_layernorm.weight": "pytorch_model-00005-of-00081.bin", "model.layers.5.self_attn.q_proj.weight": "pytorch_model-00005-of-00081.bin", "model.layers.5.self_attn.k_proj.weight": "pytorch_model-00005-of-00081.bin", "model.layers.5.self_attn.v_proj.weight": "pytorch_model-00005-of-00081.bin", "model.layers.5.self_attn.o_proj.weight": "pytorch_model-00005-of-00081.bin", "model.layers.5.mlp.gate_proj.weight": "pytorch_model-00005-of-00081.bin", "model.layers.5.mlp.down_proj.weight": "pytorch_model-00005-of-00081.bin", "model.layers.5.mlp.up_proj.weight": "pytorch_model-00005-of-00081.bin", "model.layers.5.self_attn.rotary_emb.inv_freq": "pytorch_model-00005-of-00081.bin", "model.layers.6.input_layernorm.weight": "pytorch_model-00006-of-00081.bin", "model.layers.6.post_attention_layernorm.weight": "pytorch_model-00006-of-00081.bin", "model.layers.6.self_attn.q_proj.weight": "pytorch_model-00006-of-00081.bin", "model.layers.6.self_attn.k_proj.weight": "pytorch_model-00006-of-00081.bin", "model.layers.6.self_attn.v_proj.weight": "pytorch_model-00006-of-00081.bin", "model.layers.6.self_attn.o_proj.weight": "pytorch_model-00006-of-00081.bin", "model.layers.6.mlp.gate_proj.weight": "pytorch_model-00006-of-00081.bin", "model.layers.6.mlp.down_proj.weight": "pytorch_model-00006-of-00081.bin", "model.layers.6.mlp.up_proj.weight": "pytorch_model-00006-of-00081.bin", "model.layers.6.self_attn.rotary_emb.inv_freq": "pytorch_model-00006-of-00081.bin", "model.layers.7.input_layernorm.weight": "pytorch_model-00007-of-00081.bin", "model.layers.7.post_attention_layernorm.weight": "pytorch_model-00007-of-00081.bin", "model.layers.7.self_attn.q_proj.weight": "pytorch_model-00007-of-00081.bin", "model.layers.7.self_attn.k_proj.weight": "pytorch_model-00007-of-00081.bin", "model.layers.7.self_attn.v_proj.weight": "pytorch_model-00007-of-00081.bin", "model.layers.7.self_attn.o_proj.weight": "pytorch_model-00007-of-00081.bin", "model.layers.7.mlp.gate_proj.weight": "pytorch_model-00007-of-00081.bin", "model.layers.7.mlp.down_proj.weight": "pytorch_model-00007-of-00081.bin", "model.layers.7.mlp.up_proj.weight": "pytorch_model-00007-of-00081.bin", "model.layers.7.self_attn.rotary_emb.inv_freq": "pytorch_model-00007-of-00081.bin", "model.layers.8.input_layernorm.weight": "pytorch_model-00008-of-00081.bin", "model.layers.8.post_attention_layernorm.weight": "pytorch_model-00008-of-00081.bin", "model.layers.8.self_attn.q_proj.weight": "pytorch_model-00008-of-00081.bin", "model.layers.8.self_attn.k_proj.weight": "pytorch_model-00008-of-00081.bin", "model.layers.8.self_attn.v_proj.weight": "pytorch_model-00008-of-00081.bin", "model.layers.8.self_attn.o_proj.weight": "pytorch_model-00008-of-00081.bin", "model.layers.8.mlp.gate_proj.weight": "pytorch_model-00008-of-00081.bin", "model.layers.8.mlp.down_proj.weight": "pytorch_model-00008-of-00081.bin", "model.layers.8.mlp.up_proj.weight": "pytorch_model-00008-of-00081.bin", "model.layers.8.self_attn.rotary_emb.inv_freq": "pytorch_model-00008-of-00081.bin", "model.layers.9.input_layernorm.weight": "pytorch_model-00009-of-00081.bin", "model.layers.9.post_attention_layernorm.weight": "pytorch_model-00009-of-00081.bin", "model.layers.9.self_attn.q_proj.weight": "pytorch_model-00009-of-00081.bin", "model.layers.9.self_attn.k_proj.weight": "pytorch_model-00009-of-00081.bin", "model.layers.9.self_attn.v_proj.weight": "pytorch_model-00009-of-00081.bin", "model.layers.9.self_attn.o_proj.weight": "pytorch_model-00009-of-00081.bin", "model.layers.9.mlp.gate_proj.weight": "pytorch_model-00009-of-00081.bin", "model.layers.9.mlp.down_proj.weight": "pytorch_model-00009-of-00081.bin", "model.layers.9.mlp.up_proj.weight": "pytorch_model-00009-of-00081.bin", "model.layers.9.self_attn.rotary_emb.inv_freq": "pytorch_model-00009-of-00081.bin", "model.layers.10.input_layernorm.weight": "pytorch_model-00010-of-00081.bin", "model.layers.10.post_attention_layernorm.weight": "pytorch_model-00010-of-00081.bin", "model.layers.10.self_attn.q_proj.weight": "pytorch_model-00010-of-00081.bin", "model.layers.10.self_attn.k_proj.weight": "pytorch_model-00010-of-00081.bin", "model.layers.10.self_attn.v_proj.weight": "pytorch_model-00010-of-00081.bin", "model.layers.10.self_attn.o_proj.weight": "pytorch_model-00010-of-00081.bin", "model.layers.10.mlp.gate_proj.weight": "pytorch_model-00010-of-00081.bin", "model.layers.10.mlp.down_proj.weight": "pytorch_model-00010-of-00081.bin", "model.layers.10.mlp.up_proj.weight": "pytorch_model-00010-of-00081.bin", "model.layers.10.self_attn.rotary_emb.inv_freq": "pytorch_model-00010-of-00081.bin", "model.layers.11.input_layernorm.weight": "pytorch_model-00011-of-00081.bin", "model.layers.11.post_attention_layernorm.weight": "pytorch_model-00011-of-00081.bin", "model.layers.11.self_attn.q_proj.weight": "pytorch_model-00011-of-00081.bin", "model.layers.11.self_attn.k_proj.weight": "pytorch_model-00011-of-00081.bin", "model.layers.11.self_attn.v_proj.weight": "pytorch_model-00011-of-00081.bin", "model.layers.11.self_attn.o_proj.weight": "pytorch_model-00011-of-00081.bin", "model.layers.11.mlp.gate_proj.weight": "pytorch_model-00011-of-00081.bin", "model.layers.11.mlp.down_proj.weight": "pytorch_model-00011-of-00081.bin", "model.layers.11.mlp.up_proj.weight": "pytorch_model-00011-of-00081.bin", "model.layers.11.self_attn.rotary_emb.inv_freq": "pytorch_model-00011-of-00081.bin", "model.layers.12.input_layernorm.weight": "pytorch_model-00012-of-00081.bin", "model.layers.12.post_attention_layernorm.weight": "pytorch_model-00012-of-00081.bin", "model.layers.12.self_attn.q_proj.weight": "pytorch_model-00012-of-00081.bin", "model.layers.12.self_attn.k_proj.weight": "pytorch_model-00012-of-00081.bin", "model.layers.12.self_attn.v_proj.weight": "pytorch_model-00012-of-00081.bin", "model.layers.12.self_attn.o_proj.weight": "pytorch_model-00012-of-00081.bin", "model.layers.12.mlp.gate_proj.weight": "pytorch_model-00012-of-00081.bin", "model.layers.12.mlp.down_proj.weight": "pytorch_model-00012-of-00081.bin", "model.layers.12.mlp.up_proj.weight": "pytorch_model-00012-of-00081.bin", "model.layers.12.self_attn.rotary_emb.inv_freq": "pytorch_model-00012-of-00081.bin", "model.layers.13.input_layernorm.weight": "pytorch_model-00013-of-00081.bin", "model.layers.13.post_attention_layernorm.weight": "pytorch_model-00013-of-00081.bin", "model.layers.13.self_attn.q_proj.weight": "pytorch_model-00013-of-00081.bin", "model.layers.13.self_attn.k_proj.weight": "pytorch_model-00013-of-00081.bin", "model.layers.13.self_attn.v_proj.weight": "pytorch_model-00013-of-00081.bin", "model.layers.13.self_attn.o_proj.weight": "pytorch_model-00013-of-00081.bin", "model.layers.13.mlp.gate_proj.weight": "pytorch_model-00013-of-00081.bin", "model.layers.13.mlp.down_proj.weight": "pytorch_model-00013-of-00081.bin", "model.layers.13.mlp.up_proj.weight": "pytorch_model-00013-of-00081.bin", "model.layers.13.self_attn.rotary_emb.inv_freq": "pytorch_model-00013-of-00081.bin", "model.layers.14.input_layernorm.weight": "pytorch_model-00014-of-00081.bin", "model.layers.14.post_attention_layernorm.weight": "pytorch_model-00014-of-00081.bin", "model.layers.14.self_attn.q_proj.weight": "pytorch_model-00014-of-00081.bin", "model.layers.14.self_attn.k_proj.weight": "pytorch_model-00014-of-00081.bin", "model.layers.14.self_attn.v_proj.weight": "pytorch_model-00014-of-00081.bin", "model.layers.14.self_attn.o_proj.weight": "pytorch_model-00014-of-00081.bin", "model.layers.14.mlp.gate_proj.weight": "pytorch_model-00014-of-00081.bin", "model.layers.14.mlp.down_proj.weight": "pytorch_model-00014-of-00081.bin", "model.layers.14.mlp.up_proj.weight": "pytorch_model-00014-of-00081.bin", "model.layers.14.self_attn.rotary_emb.inv_freq": "pytorch_model-00014-of-00081.bin", "model.layers.15.input_layernorm.weight": "pytorch_model-00015-of-00081.bin", "model.layers.15.post_attention_layernorm.weight": "pytorch_model-00015-of-00081.bin", "model.layers.15.self_attn.q_proj.weight": "pytorch_model-00015-of-00081.bin", "model.layers.15.self_attn.k_proj.weight": "pytorch_model-00015-of-00081.bin", "model.layers.15.self_attn.v_proj.weight": "pytorch_model-00015-of-00081.bin", "model.layers.15.self_attn.o_proj.weight": "pytorch_model-00015-of-00081.bin", "model.layers.15.mlp.gate_proj.weight": "pytorch_model-00015-of-00081.bin", "model.layers.15.mlp.down_proj.weight": "pytorch_model-00015-of-00081.bin", "model.layers.15.mlp.up_proj.weight": "pytorch_model-00015-of-00081.bin", "model.layers.15.self_attn.rotary_emb.inv_freq": "pytorch_model-00015-of-00081.bin", "model.layers.16.input_layernorm.weight": "pytorch_model-00016-of-00081.bin", "model.layers.16.post_attention_layernorm.weight": "pytorch_model-00016-of-00081.bin", "model.layers.16.self_attn.q_proj.weight": "pytorch_model-00016-of-00081.bin", "model.layers.16.self_attn.k_proj.weight": "pytorch_model-00016-of-00081.bin", "model.layers.16.self_attn.v_proj.weight": "pytorch_model-00016-of-00081.bin", "model.layers.16.self_attn.o_proj.weight": "pytorch_model-00016-of-00081.bin", "model.layers.16.mlp.gate_proj.weight": "pytorch_model-00016-of-00081.bin", "model.layers.16.mlp.down_proj.weight": "pytorch_model-00016-of-00081.bin", "model.layers.16.mlp.up_proj.weight": "pytorch_model-00016-of-00081.bin", "model.layers.16.self_attn.rotary_emb.inv_freq": "pytorch_model-00016-of-00081.bin", "model.layers.17.input_layernorm.weight": "pytorch_model-00017-of-00081.bin", "model.layers.17.post_attention_layernorm.weight": "pytorch_model-00017-of-00081.bin", "model.layers.17.self_attn.q_proj.weight": "pytorch_model-00017-of-00081.bin", "model.layers.17.self_attn.k_proj.weight": "pytorch_model-00017-of-00081.bin", "model.layers.17.self_attn.v_proj.weight": "pytorch_model-00017-of-00081.bin", "model.layers.17.self_attn.o_proj.weight": "pytorch_model-00017-of-00081.bin", "model.layers.17.mlp.gate_proj.weight": "pytorch_model-00017-of-00081.bin", "model.layers.17.mlp.down_proj.weight": "pytorch_model-00017-of-00081.bin", "model.layers.17.mlp.up_proj.weight": "pytorch_model-00017-of-00081.bin", "model.layers.17.self_attn.rotary_emb.inv_freq": "pytorch_model-00017-of-00081.bin", "model.layers.18.input_layernorm.weight": "pytorch_model-00018-of-00081.bin", "model.layers.18.post_attention_layernorm.weight": "pytorch_model-00018-of-00081.bin", "model.layers.18.self_attn.q_proj.weight": "pytorch_model-00018-of-00081.bin", "model.layers.18.self_attn.k_proj.weight": "pytorch_model-00018-of-00081.bin", "model.layers.18.self_attn.v_proj.weight": "pytorch_model-00018-of-00081.bin", "model.layers.18.self_attn.o_proj.weight": "pytorch_model-00018-of-00081.bin", "model.layers.18.mlp.gate_proj.weight": "pytorch_model-00018-of-00081.bin", "model.layers.18.mlp.down_proj.weight": "pytorch_model-00018-of-00081.bin", "model.layers.18.mlp.up_proj.weight": "pytorch_model-00018-of-00081.bin", "model.layers.18.self_attn.rotary_emb.inv_freq": "pytorch_model-00018-of-00081.bin", "model.layers.19.input_layernorm.weight": "pytorch_model-00019-of-00081.bin", "model.layers.19.post_attention_layernorm.weight": "pytorch_model-00019-of-00081.bin", "model.layers.19.self_attn.q_proj.weight": "pytorch_model-00019-of-00081.bin", "model.layers.19.self_attn.k_proj.weight": "pytorch_model-00019-of-00081.bin", "model.layers.19.self_attn.v_proj.weight": "pytorch_model-00019-of-00081.bin", "model.layers.19.self_attn.o_proj.weight": "pytorch_model-00019-of-00081.bin", "model.layers.19.mlp.gate_proj.weight": "pytorch_model-00019-of-00081.bin", "model.layers.19.mlp.down_proj.weight": "pytorch_model-00019-of-00081.bin", "model.layers.19.mlp.up_proj.weight": "pytorch_model-00019-of-00081.bin", "model.layers.19.self_attn.rotary_emb.inv_freq": "pytorch_model-00019-of-00081.bin", "model.layers.20.input_layernorm.weight": "pytorch_model-00020-of-00081.bin", "model.layers.20.post_attention_layernorm.weight": "pytorch_model-00020-of-00081.bin", "model.layers.20.self_attn.q_proj.weight": "pytorch_model-00020-of-00081.bin", "model.layers.20.self_attn.k_proj.weight": "pytorch_model-00020-of-00081.bin", "model.layers.20.self_attn.v_proj.weight": "pytorch_model-00020-of-00081.bin", "model.layers.20.self_attn.o_proj.weight": "pytorch_model-00020-of-00081.bin", "model.layers.20.mlp.gate_proj.weight": "pytorch_model-00020-of-00081.bin", "model.layers.20.mlp.down_proj.weight": "pytorch_model-00020-of-00081.bin", "model.layers.20.mlp.up_proj.weight": "pytorch_model-00020-of-00081.bin", "model.layers.20.self_attn.rotary_emb.inv_freq": "pytorch_model-00020-of-00081.bin", "model.layers.21.input_layernorm.weight": "pytorch_model-00021-of-00081.bin", "model.layers.21.post_attention_layernorm.weight": "pytorch_model-00021-of-00081.bin", "model.layers.21.self_attn.q_proj.weight": "pytorch_model-00021-of-00081.bin", "model.layers.21.self_attn.k_proj.weight": "pytorch_model-00021-of-00081.bin", "model.layers.21.self_attn.v_proj.weight": "pytorch_model-00021-of-00081.bin", "model.layers.21.self_attn.o_proj.weight": "pytorch_model-00021-of-00081.bin", "model.layers.21.mlp.gate_proj.weight": "pytorch_model-00021-of-00081.bin", "model.layers.21.mlp.down_proj.weight": "pytorch_model-00021-of-00081.bin", "model.layers.21.mlp.up_proj.weight": "pytorch_model-00021-of-00081.bin", "model.layers.21.self_attn.rotary_emb.inv_freq": "pytorch_model-00021-of-00081.bin", "model.layers.22.input_layernorm.weight": "pytorch_model-00022-of-00081.bin", "model.layers.22.post_attention_layernorm.weight": "pytorch_model-00022-of-00081.bin", "model.layers.22.self_attn.q_proj.weight": "pytorch_model-00022-of-00081.bin", "model.layers.22.self_attn.k_proj.weight": "pytorch_model-00022-of-00081.bin", "model.layers.22.self_attn.v_proj.weight": "pytorch_model-00022-of-00081.bin", "model.layers.22.self_attn.o_proj.weight": "pytorch_model-00022-of-00081.bin", "model.layers.22.mlp.gate_proj.weight": "pytorch_model-00022-of-00081.bin", "model.layers.22.mlp.down_proj.weight": "pytorch_model-00022-of-00081.bin", "model.layers.22.mlp.up_proj.weight": "pytorch_model-00022-of-00081.bin", "model.layers.22.self_attn.rotary_emb.inv_freq": "pytorch_model-00022-of-00081.bin", "model.layers.23.input_layernorm.weight": "pytorch_model-00023-of-00081.bin", "model.layers.23.post_attention_layernorm.weight": "pytorch_model-00023-of-00081.bin", "model.layers.23.self_attn.q_proj.weight": "pytorch_model-00023-of-00081.bin", "model.layers.23.self_attn.k_proj.weight": "pytorch_model-00023-of-00081.bin", "model.layers.23.self_attn.v_proj.weight": "pytorch_model-00023-of-00081.bin", "model.layers.23.self_attn.o_proj.weight": "pytorch_model-00023-of-00081.bin", "model.layers.23.mlp.gate_proj.weight": "pytorch_model-00023-of-00081.bin", "model.layers.23.mlp.down_proj.weight": "pytorch_model-00023-of-00081.bin", "model.layers.23.mlp.up_proj.weight": "pytorch_model-00023-of-00081.bin", "model.layers.23.self_attn.rotary_emb.inv_freq": "pytorch_model-00023-of-00081.bin", "model.layers.24.input_layernorm.weight": "pytorch_model-00024-of-00081.bin", "model.layers.24.post_attention_layernorm.weight": "pytorch_model-00024-of-00081.bin", "model.layers.24.self_attn.q_proj.weight": "pytorch_model-00024-of-00081.bin", "model.layers.24.self_attn.k_proj.weight": "pytorch_model-00024-of-00081.bin", "model.layers.24.self_attn.v_proj.weight": "pytorch_model-00024-of-00081.bin", "model.layers.24.self_attn.o_proj.weight": "pytorch_model-00024-of-00081.bin", "model.layers.24.mlp.gate_proj.weight": "pytorch_model-00024-of-00081.bin", "model.layers.24.mlp.down_proj.weight": "pytorch_model-00024-of-00081.bin", "model.layers.24.mlp.up_proj.weight": "pytorch_model-00024-of-00081.bin", "model.layers.24.self_attn.rotary_emb.inv_freq": "pytorch_model-00024-of-00081.bin", "model.layers.25.input_layernorm.weight": "pytorch_model-00025-of-00081.bin", "model.layers.25.post_attention_layernorm.weight": "pytorch_model-00025-of-00081.bin", "model.layers.25.self_attn.q_proj.weight": "pytorch_model-00025-of-00081.bin", "model.layers.25.self_attn.k_proj.weight": "pytorch_model-00025-of-00081.bin", "model.layers.25.self_attn.v_proj.weight": "pytorch_model-00025-of-00081.bin", "model.layers.25.self_attn.o_proj.weight": "pytorch_model-00025-of-00081.bin", "model.layers.25.mlp.gate_proj.weight": "pytorch_model-00025-of-00081.bin", "model.layers.25.mlp.down_proj.weight": "pytorch_model-00025-of-00081.bin", "model.layers.25.mlp.up_proj.weight": "pytorch_model-00025-of-00081.bin", "model.layers.25.self_attn.rotary_emb.inv_freq": "pytorch_model-00025-of-00081.bin", "model.layers.26.input_layernorm.weight": "pytorch_model-00026-of-00081.bin", "model.layers.26.post_attention_layernorm.weight": "pytorch_model-00026-of-00081.bin", "model.layers.26.self_attn.q_proj.weight": "pytorch_model-00026-of-00081.bin", "model.layers.26.self_attn.k_proj.weight": "pytorch_model-00026-of-00081.bin", "model.layers.26.self_attn.v_proj.weight": "pytorch_model-00026-of-00081.bin", "model.layers.26.self_attn.o_proj.weight": "pytorch_model-00026-of-00081.bin", "model.layers.26.mlp.gate_proj.weight": "pytorch_model-00026-of-00081.bin", "model.layers.26.mlp.down_proj.weight": "pytorch_model-00026-of-00081.bin", "model.layers.26.mlp.up_proj.weight": "pytorch_model-00026-of-00081.bin", "model.layers.26.self_attn.rotary_emb.inv_freq": "pytorch_model-00026-of-00081.bin", "model.layers.27.input_layernorm.weight": "pytorch_model-00027-of-00081.bin", "model.layers.27.post_attention_layernorm.weight": "pytorch_model-00027-of-00081.bin", "model.layers.27.self_attn.q_proj.weight": "pytorch_model-00027-of-00081.bin", "model.layers.27.self_attn.k_proj.weight": "pytorch_model-00027-of-00081.bin", "model.layers.27.self_attn.v_proj.weight": "pytorch_model-00027-of-00081.bin", "model.layers.27.self_attn.o_proj.weight": "pytorch_model-00027-of-00081.bin", "model.layers.27.mlp.gate_proj.weight": "pytorch_model-00027-of-00081.bin", "model.layers.27.mlp.down_proj.weight": "pytorch_model-00027-of-00081.bin", "model.layers.27.mlp.up_proj.weight": "pytorch_model-00027-of-00081.bin", "model.layers.27.self_attn.rotary_emb.inv_freq": "pytorch_model-00027-of-00081.bin", "model.layers.28.input_layernorm.weight": "pytorch_model-00028-of-00081.bin", "model.layers.28.post_attention_layernorm.weight": "pytorch_model-00028-of-00081.bin", "model.layers.28.self_attn.q_proj.weight": "pytorch_model-00028-of-00081.bin", "model.layers.28.self_attn.k_proj.weight": "pytorch_model-00028-of-00081.bin", "model.layers.28.self_attn.v_proj.weight": "pytorch_model-00028-of-00081.bin", "model.layers.28.self_attn.o_proj.weight": "pytorch_model-00028-of-00081.bin", "model.layers.28.mlp.gate_proj.weight": "pytorch_model-00028-of-00081.bin", "model.layers.28.mlp.down_proj.weight": "pytorch_model-00028-of-00081.bin", "model.layers.28.mlp.up_proj.weight": "pytorch_model-00028-of-00081.bin", "model.layers.28.self_attn.rotary_emb.inv_freq": "pytorch_model-00028-of-00081.bin", "model.layers.29.input_layernorm.weight": "pytorch_model-00029-of-00081.bin", "model.layers.29.post_attention_layernorm.weight": "pytorch_model-00029-of-00081.bin", "model.layers.29.self_attn.q_proj.weight": "pytorch_model-00029-of-00081.bin", "model.layers.29.self_attn.k_proj.weight": "pytorch_model-00029-of-00081.bin", "model.layers.29.self_attn.v_proj.weight": "pytorch_model-00029-of-00081.bin", "model.layers.29.self_attn.o_proj.weight": "pytorch_model-00029-of-00081.bin", "model.layers.29.mlp.gate_proj.weight": "pytorch_model-00029-of-00081.bin", "model.layers.29.mlp.down_proj.weight": "pytorch_model-00029-of-00081.bin", "model.layers.29.mlp.up_proj.weight": "pytorch_model-00029-of-00081.bin", "model.layers.29.self_attn.rotary_emb.inv_freq": "pytorch_model-00029-of-00081.bin", "model.layers.30.input_layernorm.weight": "pytorch_model-00030-of-00081.bin", "model.layers.30.post_attention_layernorm.weight": "pytorch_model-00030-of-00081.bin", "model.layers.30.self_attn.q_proj.weight": "pytorch_model-00030-of-00081.bin", "model.layers.30.self_attn.k_proj.weight": "pytorch_model-00030-of-00081.bin", "model.layers.30.self_attn.v_proj.weight": "pytorch_model-00030-of-00081.bin", "model.layers.30.self_attn.o_proj.weight": "pytorch_model-00030-of-00081.bin", "model.layers.30.mlp.gate_proj.weight": "pytorch_model-00030-of-00081.bin", "model.layers.30.mlp.down_proj.weight": "pytorch_model-00030-of-00081.bin", "model.layers.30.mlp.up_proj.weight": "pytorch_model-00030-of-00081.bin", "model.layers.30.self_attn.rotary_emb.inv_freq": "pytorch_model-00030-of-00081.bin", "model.layers.31.input_layernorm.weight": "pytorch_model-00031-of-00081.bin", "model.layers.31.post_attention_layernorm.weight": "pytorch_model-00031-of-00081.bin", "model.layers.31.self_attn.q_proj.weight": "pytorch_model-00031-of-00081.bin", "model.layers.31.self_attn.k_proj.weight": "pytorch_model-00031-of-00081.bin", "model.layers.31.self_attn.v_proj.weight": "pytorch_model-00031-of-00081.bin", "model.layers.31.self_attn.o_proj.weight": "pytorch_model-00031-of-00081.bin", "model.layers.31.mlp.gate_proj.weight": "pytorch_model-00031-of-00081.bin", "model.layers.31.mlp.down_proj.weight": "pytorch_model-00031-of-00081.bin", "model.layers.31.mlp.up_proj.weight": "pytorch_model-00031-of-00081.bin", "model.layers.31.self_attn.rotary_emb.inv_freq": "pytorch_model-00031-of-00081.bin", "model.layers.32.input_layernorm.weight": "pytorch_model-00032-of-00081.bin", "model.layers.32.post_attention_layernorm.weight": "pytorch_model-00032-of-00081.bin", "model.layers.32.self_attn.q_proj.weight": "pytorch_model-00032-of-00081.bin", "model.layers.32.self_attn.k_proj.weight": "pytorch_model-00032-of-00081.bin", "model.layers.32.self_attn.v_proj.weight": "pytorch_model-00032-of-00081.bin", "model.layers.32.self_attn.o_proj.weight": "pytorch_model-00032-of-00081.bin", "model.layers.32.mlp.gate_proj.weight": "pytorch_model-00032-of-00081.bin", "model.layers.32.mlp.down_proj.weight": "pytorch_model-00032-of-00081.bin", "model.layers.32.mlp.up_proj.weight": "pytorch_model-00032-of-00081.bin", "model.layers.32.self_attn.rotary_emb.inv_freq": "pytorch_model-00032-of-00081.bin", "model.layers.33.input_layernorm.weight": "pytorch_model-00033-of-00081.bin", "model.layers.33.post_attention_layernorm.weight": "pytorch_model-00033-of-00081.bin", "model.layers.33.self_attn.q_proj.weight": "pytorch_model-00033-of-00081.bin", "model.layers.33.self_attn.k_proj.weight": "pytorch_model-00033-of-00081.bin", "model.layers.33.self_attn.v_proj.weight": "pytorch_model-00033-of-00081.bin", "model.layers.33.self_attn.o_proj.weight": "pytorch_model-00033-of-00081.bin", "model.layers.33.mlp.gate_proj.weight": "pytorch_model-00033-of-00081.bin", "model.layers.33.mlp.down_proj.weight": "pytorch_model-00033-of-00081.bin", "model.layers.33.mlp.up_proj.weight": "pytorch_model-00033-of-00081.bin", "model.layers.33.self_attn.rotary_emb.inv_freq": "pytorch_model-00033-of-00081.bin", "model.layers.34.input_layernorm.weight": "pytorch_model-00034-of-00081.bin", "model.layers.34.post_attention_layernorm.weight": "pytorch_model-00034-of-00081.bin", "model.layers.34.self_attn.q_proj.weight": "pytorch_model-00034-of-00081.bin", "model.layers.34.self_attn.k_proj.weight": "pytorch_model-00034-of-00081.bin", "model.layers.34.self_attn.v_proj.weight": "pytorch_model-00034-of-00081.bin", "model.layers.34.self_attn.o_proj.weight": "pytorch_model-00034-of-00081.bin", "model.layers.34.mlp.gate_proj.weight": "pytorch_model-00034-of-00081.bin", "model.layers.34.mlp.down_proj.weight": "pytorch_model-00034-of-00081.bin", "model.layers.34.mlp.up_proj.weight": "pytorch_model-00034-of-00081.bin", "model.layers.34.self_attn.rotary_emb.inv_freq": "pytorch_model-00034-of-00081.bin", "model.layers.35.input_layernorm.weight": "pytorch_model-00035-of-00081.bin", "model.layers.35.post_attention_layernorm.weight": "pytorch_model-00035-of-00081.bin", "model.layers.35.self_attn.q_proj.weight": "pytorch_model-00035-of-00081.bin", "model.layers.35.self_attn.k_proj.weight": "pytorch_model-00035-of-00081.bin", "model.layers.35.self_attn.v_proj.weight": "pytorch_model-00035-of-00081.bin", "model.layers.35.self_attn.o_proj.weight": "pytorch_model-00035-of-00081.bin", "model.layers.35.mlp.gate_proj.weight": "pytorch_model-00035-of-00081.bin", "model.layers.35.mlp.down_proj.weight": "pytorch_model-00035-of-00081.bin", "model.layers.35.mlp.up_proj.weight": "pytorch_model-00035-of-00081.bin", "model.layers.35.self_attn.rotary_emb.inv_freq": "pytorch_model-00035-of-00081.bin", "model.layers.36.input_layernorm.weight": "pytorch_model-00036-of-00081.bin", "model.layers.36.post_attention_layernorm.weight": "pytorch_model-00036-of-00081.bin", "model.layers.36.self_attn.q_proj.weight": "pytorch_model-00036-of-00081.bin", "model.layers.36.self_attn.k_proj.weight": "pytorch_model-00036-of-00081.bin", "model.layers.36.self_attn.v_proj.weight": "pytorch_model-00036-of-00081.bin", "model.layers.36.self_attn.o_proj.weight": "pytorch_model-00036-of-00081.bin", "model.layers.36.mlp.gate_proj.weight": "pytorch_model-00036-of-00081.bin", "model.layers.36.mlp.down_proj.weight": "pytorch_model-00036-of-00081.bin", "model.layers.36.mlp.up_proj.weight": "pytorch_model-00036-of-00081.bin", "model.layers.36.self_attn.rotary_emb.inv_freq": "pytorch_model-00036-of-00081.bin", "model.layers.37.input_layernorm.weight": "pytorch_model-00037-of-00081.bin", "model.layers.37.post_attention_layernorm.weight": "pytorch_model-00037-of-00081.bin", "model.layers.37.self_attn.q_proj.weight": "pytorch_model-00037-of-00081.bin", "model.layers.37.self_attn.k_proj.weight": "pytorch_model-00037-of-00081.bin", "model.layers.37.self_attn.v_proj.weight": "pytorch_model-00037-of-00081.bin", "model.layers.37.self_attn.o_proj.weight": "pytorch_model-00037-of-00081.bin", "model.layers.37.mlp.gate_proj.weight": "pytorch_model-00037-of-00081.bin", "model.layers.37.mlp.down_proj.weight": "pytorch_model-00037-of-00081.bin", "model.layers.37.mlp.up_proj.weight": "pytorch_model-00037-of-00081.bin", "model.layers.37.self_attn.rotary_emb.inv_freq": "pytorch_model-00037-of-00081.bin", "model.layers.38.input_layernorm.weight": "pytorch_model-00038-of-00081.bin", "model.layers.38.post_attention_layernorm.weight": "pytorch_model-00038-of-00081.bin", "model.layers.38.self_attn.q_proj.weight": "pytorch_model-00038-of-00081.bin", "model.layers.38.self_attn.k_proj.weight": "pytorch_model-00038-of-00081.bin", "model.layers.38.self_attn.v_proj.weight": "pytorch_model-00038-of-00081.bin", "model.layers.38.self_attn.o_proj.weight": "pytorch_model-00038-of-00081.bin", "model.layers.38.mlp.gate_proj.weight": "pytorch_model-00038-of-00081.bin", "model.layers.38.mlp.down_proj.weight": "pytorch_model-00038-of-00081.bin", "model.layers.38.mlp.up_proj.weight": "pytorch_model-00038-of-00081.bin", "model.layers.38.self_attn.rotary_emb.inv_freq": "pytorch_model-00038-of-00081.bin", "model.layers.39.input_layernorm.weight": "pytorch_model-00039-of-00081.bin", "model.layers.39.post_attention_layernorm.weight": "pytorch_model-00039-of-00081.bin", "model.layers.39.self_attn.q_proj.weight": "pytorch_model-00039-of-00081.bin", "model.layers.39.self_attn.k_proj.weight": "pytorch_model-00039-of-00081.bin", "model.layers.39.self_attn.v_proj.weight": "pytorch_model-00039-of-00081.bin", "model.layers.39.self_attn.o_proj.weight": "pytorch_model-00039-of-00081.bin", "model.layers.39.mlp.gate_proj.weight": "pytorch_model-00039-of-00081.bin", "model.layers.39.mlp.down_proj.weight": "pytorch_model-00039-of-00081.bin", "model.layers.39.mlp.up_proj.weight": "pytorch_model-00039-of-00081.bin", "model.layers.39.self_attn.rotary_emb.inv_freq": "pytorch_model-00039-of-00081.bin", "model.layers.40.input_layernorm.weight": "pytorch_model-00040-of-00081.bin", "model.layers.40.post_attention_layernorm.weight": "pytorch_model-00040-of-00081.bin", "model.layers.40.self_attn.q_proj.weight": "pytorch_model-00040-of-00081.bin", "model.layers.40.self_attn.k_proj.weight": "pytorch_model-00040-of-00081.bin", "model.layers.40.self_attn.v_proj.weight": "pytorch_model-00040-of-00081.bin", "model.layers.40.self_attn.o_proj.weight": "pytorch_model-00040-of-00081.bin", "model.layers.40.mlp.gate_proj.weight": "pytorch_model-00040-of-00081.bin", "model.layers.40.mlp.down_proj.weight": "pytorch_model-00040-of-00081.bin", "model.layers.40.mlp.up_proj.weight": "pytorch_model-00040-of-00081.bin", "model.layers.40.self_attn.rotary_emb.inv_freq": "pytorch_model-00040-of-00081.bin", "model.layers.41.input_layernorm.weight": "pytorch_model-00041-of-00081.bin", "model.layers.41.post_attention_layernorm.weight": "pytorch_model-00041-of-00081.bin", "model.layers.41.self_attn.q_proj.weight": "pytorch_model-00041-of-00081.bin", "model.layers.41.self_attn.k_proj.weight": "pytorch_model-00041-of-00081.bin", "model.layers.41.self_attn.v_proj.weight": "pytorch_model-00041-of-00081.bin", "model.layers.41.self_attn.o_proj.weight": "pytorch_model-00041-of-00081.bin", "model.layers.41.mlp.gate_proj.weight": "pytorch_model-00041-of-00081.bin", "model.layers.41.mlp.down_proj.weight": "pytorch_model-00041-of-00081.bin", "model.layers.41.mlp.up_proj.weight": "pytorch_model-00041-of-00081.bin", "model.layers.41.self_attn.rotary_emb.inv_freq": "pytorch_model-00041-of-00081.bin", "model.layers.42.input_layernorm.weight": "pytorch_model-00042-of-00081.bin", "model.layers.42.post_attention_layernorm.weight": "pytorch_model-00042-of-00081.bin", "model.layers.42.self_attn.q_proj.weight": "pytorch_model-00042-of-00081.bin", "model.layers.42.self_attn.k_proj.weight": "pytorch_model-00042-of-00081.bin", "model.layers.42.self_attn.v_proj.weight": "pytorch_model-00042-of-00081.bin", "model.layers.42.self_attn.o_proj.weight": "pytorch_model-00042-of-00081.bin", "model.layers.42.mlp.gate_proj.weight": "pytorch_model-00042-of-00081.bin", "model.layers.42.mlp.down_proj.weight": "pytorch_model-00042-of-00081.bin", "model.layers.42.mlp.up_proj.weight": "pytorch_model-00042-of-00081.bin", "model.layers.42.self_attn.rotary_emb.inv_freq": "pytorch_model-00042-of-00081.bin", "model.layers.43.input_layernorm.weight": "pytorch_model-00043-of-00081.bin", "model.layers.43.post_attention_layernorm.weight": "pytorch_model-00043-of-00081.bin", "model.layers.43.self_attn.q_proj.weight": "pytorch_model-00043-of-00081.bin", "model.layers.43.self_attn.k_proj.weight": "pytorch_model-00043-of-00081.bin", "model.layers.43.self_attn.v_proj.weight": "pytorch_model-00043-of-00081.bin", "model.layers.43.self_attn.o_proj.weight": "pytorch_model-00043-of-00081.bin", "model.layers.43.mlp.gate_proj.weight": "pytorch_model-00043-of-00081.bin", "model.layers.43.mlp.down_proj.weight": "pytorch_model-00043-of-00081.bin", "model.layers.43.mlp.up_proj.weight": "pytorch_model-00043-of-00081.bin", "model.layers.43.self_attn.rotary_emb.inv_freq": "pytorch_model-00043-of-00081.bin", "model.layers.44.input_layernorm.weight": "pytorch_model-00044-of-00081.bin", "model.layers.44.post_attention_layernorm.weight": "pytorch_model-00044-of-00081.bin", "model.layers.44.self_attn.q_proj.weight": "pytorch_model-00044-of-00081.bin", "model.layers.44.self_attn.k_proj.weight": "pytorch_model-00044-of-00081.bin", "model.layers.44.self_attn.v_proj.weight": "pytorch_model-00044-of-00081.bin", "model.layers.44.self_attn.o_proj.weight": "pytorch_model-00044-of-00081.bin", "model.layers.44.mlp.gate_proj.weight": "pytorch_model-00044-of-00081.bin", "model.layers.44.mlp.down_proj.weight": "pytorch_model-00044-of-00081.bin", "model.layers.44.mlp.up_proj.weight": "pytorch_model-00044-of-00081.bin", "model.layers.44.self_attn.rotary_emb.inv_freq": "pytorch_model-00044-of-00081.bin", "model.layers.45.input_layernorm.weight": "pytorch_model-00045-of-00081.bin", "model.layers.45.post_attention_layernorm.weight": "pytorch_model-00045-of-00081.bin", "model.layers.45.self_attn.q_proj.weight": "pytorch_model-00045-of-00081.bin", "model.layers.45.self_attn.k_proj.weight": "pytorch_model-00045-of-00081.bin", "model.layers.45.self_attn.v_proj.weight": "pytorch_model-00045-of-00081.bin", "model.layers.45.self_attn.o_proj.weight": "pytorch_model-00045-of-00081.bin", "model.layers.45.mlp.gate_proj.weight": "pytorch_model-00045-of-00081.bin", "model.layers.45.mlp.down_proj.weight": "pytorch_model-00045-of-00081.bin", "model.layers.45.mlp.up_proj.weight": "pytorch_model-00045-of-00081.bin", "model.layers.45.self_attn.rotary_emb.inv_freq": "pytorch_model-00045-of-00081.bin", "model.layers.46.input_layernorm.weight": "pytorch_model-00046-of-00081.bin", "model.layers.46.post_attention_layernorm.weight": "pytorch_model-00046-of-00081.bin", "model.layers.46.self_attn.q_proj.weight": "pytorch_model-00046-of-00081.bin", "model.layers.46.self_attn.k_proj.weight": "pytorch_model-00046-of-00081.bin", "model.layers.46.self_attn.v_proj.weight": "pytorch_model-00046-of-00081.bin", "model.layers.46.self_attn.o_proj.weight": "pytorch_model-00046-of-00081.bin", "model.layers.46.mlp.gate_proj.weight": "pytorch_model-00046-of-00081.bin", "model.layers.46.mlp.down_proj.weight": "pytorch_model-00046-of-00081.bin", "model.layers.46.mlp.up_proj.weight": "pytorch_model-00046-of-00081.bin", "model.layers.46.self_attn.rotary_emb.inv_freq": "pytorch_model-00046-of-00081.bin", "model.layers.47.input_layernorm.weight": "pytorch_model-00047-of-00081.bin", "model.layers.47.post_attention_layernorm.weight": "pytorch_model-00047-of-00081.bin", "model.layers.47.self_attn.q_proj.weight": "pytorch_model-00047-of-00081.bin", "model.layers.47.self_attn.k_proj.weight": "pytorch_model-00047-of-00081.bin", "model.layers.47.self_attn.v_proj.weight": "pytorch_model-00047-of-00081.bin", "model.layers.47.self_attn.o_proj.weight": "pytorch_model-00047-of-00081.bin", "model.layers.47.mlp.gate_proj.weight": "pytorch_model-00047-of-00081.bin", "model.layers.47.mlp.down_proj.weight": "pytorch_model-00047-of-00081.bin", "model.layers.47.mlp.up_proj.weight": "pytorch_model-00047-of-00081.bin", "model.layers.47.self_attn.rotary_emb.inv_freq": "pytorch_model-00047-of-00081.bin", "model.layers.48.input_layernorm.weight": "pytorch_model-00048-of-00081.bin", "model.layers.48.post_attention_layernorm.weight": "pytorch_model-00048-of-00081.bin", "model.layers.48.self_attn.q_proj.weight": "pytorch_model-00048-of-00081.bin", "model.layers.48.self_attn.k_proj.weight": "pytorch_model-00048-of-00081.bin", "model.layers.48.self_attn.v_proj.weight": "pytorch_model-00048-of-00081.bin", "model.layers.48.self_attn.o_proj.weight": "pytorch_model-00048-of-00081.bin", "model.layers.48.mlp.gate_proj.weight": "pytorch_model-00048-of-00081.bin", "model.layers.48.mlp.down_proj.weight": "pytorch_model-00048-of-00081.bin", "model.layers.48.mlp.up_proj.weight": "pytorch_model-00048-of-00081.bin", "model.layers.48.self_attn.rotary_emb.inv_freq": "pytorch_model-00048-of-00081.bin", "model.layers.49.input_layernorm.weight": "pytorch_model-00049-of-00081.bin", "model.layers.49.post_attention_layernorm.weight": "pytorch_model-00049-of-00081.bin", "model.layers.49.self_attn.q_proj.weight": "pytorch_model-00049-of-00081.bin", "model.layers.49.self_attn.k_proj.weight": "pytorch_model-00049-of-00081.bin", "model.layers.49.self_attn.v_proj.weight": "pytorch_model-00049-of-00081.bin", "model.layers.49.self_attn.o_proj.weight": "pytorch_model-00049-of-00081.bin", "model.layers.49.mlp.gate_proj.weight": "pytorch_model-00049-of-00081.bin", "model.layers.49.mlp.down_proj.weight": "pytorch_model-00049-of-00081.bin", "model.layers.49.mlp.up_proj.weight": "pytorch_model-00049-of-00081.bin", "model.layers.49.self_attn.rotary_emb.inv_freq": "pytorch_model-00049-of-00081.bin", "model.layers.50.input_layernorm.weight": "pytorch_model-00050-of-00081.bin", "model.layers.50.post_attention_layernorm.weight": "pytorch_model-00050-of-00081.bin", "model.layers.50.self_attn.q_proj.weight": "pytorch_model-00050-of-00081.bin", "model.layers.50.self_attn.k_proj.weight": "pytorch_model-00050-of-00081.bin", "model.layers.50.self_attn.v_proj.weight": "pytorch_model-00050-of-00081.bin", "model.layers.50.self_attn.o_proj.weight": "pytorch_model-00050-of-00081.bin", "model.layers.50.mlp.gate_proj.weight": "pytorch_model-00050-of-00081.bin", "model.layers.50.mlp.down_proj.weight": "pytorch_model-00050-of-00081.bin", "model.layers.50.mlp.up_proj.weight": "pytorch_model-00050-of-00081.bin", "model.layers.50.self_attn.rotary_emb.inv_freq": "pytorch_model-00050-of-00081.bin", "model.layers.51.input_layernorm.weight": "pytorch_model-00051-of-00081.bin", "model.layers.51.post_attention_layernorm.weight": "pytorch_model-00051-of-00081.bin", "model.layers.51.self_attn.q_proj.weight": "pytorch_model-00051-of-00081.bin", "model.layers.51.self_attn.k_proj.weight": "pytorch_model-00051-of-00081.bin", "model.layers.51.self_attn.v_proj.weight": "pytorch_model-00051-of-00081.bin", "model.layers.51.self_attn.o_proj.weight": "pytorch_model-00051-of-00081.bin", "model.layers.51.mlp.gate_proj.weight": "pytorch_model-00051-of-00081.bin", "model.layers.51.mlp.down_proj.weight": "pytorch_model-00051-of-00081.bin", "model.layers.51.mlp.up_proj.weight": "pytorch_model-00051-of-00081.bin", "model.layers.51.self_attn.rotary_emb.inv_freq": "pytorch_model-00051-of-00081.bin", "model.layers.52.input_layernorm.weight": "pytorch_model-00052-of-00081.bin", "model.layers.52.post_attention_layernorm.weight": "pytorch_model-00052-of-00081.bin", "model.layers.52.self_attn.q_proj.weight": "pytorch_model-00052-of-00081.bin", "model.layers.52.self_attn.k_proj.weight": "pytorch_model-00052-of-00081.bin", "model.layers.52.self_attn.v_proj.weight": "pytorch_model-00052-of-00081.bin", "model.layers.52.self_attn.o_proj.weight": "pytorch_model-00052-of-00081.bin", "model.layers.52.mlp.gate_proj.weight": "pytorch_model-00052-of-00081.bin", "model.layers.52.mlp.down_proj.weight": "pytorch_model-00052-of-00081.bin", "model.layers.52.mlp.up_proj.weight": "pytorch_model-00052-of-00081.bin", "model.layers.52.self_attn.rotary_emb.inv_freq": "pytorch_model-00052-of-00081.bin", "model.layers.53.input_layernorm.weight": "pytorch_model-00053-of-00081.bin", "model.layers.53.post_attention_layernorm.weight": "pytorch_model-00053-of-00081.bin", "model.layers.53.self_attn.q_proj.weight": "pytorch_model-00053-of-00081.bin", "model.layers.53.self_attn.k_proj.weight": "pytorch_model-00053-of-00081.bin", "model.layers.53.self_attn.v_proj.weight": "pytorch_model-00053-of-00081.bin", "model.layers.53.self_attn.o_proj.weight": "pytorch_model-00053-of-00081.bin", "model.layers.53.mlp.gate_proj.weight": "pytorch_model-00053-of-00081.bin", "model.layers.53.mlp.down_proj.weight": "pytorch_model-00053-of-00081.bin", "model.layers.53.mlp.up_proj.weight": "pytorch_model-00053-of-00081.bin", "model.layers.53.self_attn.rotary_emb.inv_freq": "pytorch_model-00053-of-00081.bin", "model.layers.54.input_layernorm.weight": "pytorch_model-00054-of-00081.bin", "model.layers.54.post_attention_layernorm.weight": "pytorch_model-00054-of-00081.bin", "model.layers.54.self_attn.q_proj.weight": "pytorch_model-00054-of-00081.bin", "model.layers.54.self_attn.k_proj.weight": "pytorch_model-00054-of-00081.bin", "model.layers.54.self_attn.v_proj.weight": "pytorch_model-00054-of-00081.bin", "model.layers.54.self_attn.o_proj.weight": "pytorch_model-00054-of-00081.bin", "model.layers.54.mlp.gate_proj.weight": "pytorch_model-00054-of-00081.bin", "model.layers.54.mlp.down_proj.weight": "pytorch_model-00054-of-00081.bin", "model.layers.54.mlp.up_proj.weight": "pytorch_model-00054-of-00081.bin", "model.layers.54.self_attn.rotary_emb.inv_freq": "pytorch_model-00054-of-00081.bin", "model.layers.55.input_layernorm.weight": "pytorch_model-00055-of-00081.bin", "model.layers.55.post_attention_layernorm.weight": "pytorch_model-00055-of-00081.bin", "model.layers.55.self_attn.q_proj.weight": "pytorch_model-00055-of-00081.bin", "model.layers.55.self_attn.k_proj.weight": "pytorch_model-00055-of-00081.bin", "model.layers.55.self_attn.v_proj.weight": "pytorch_model-00055-of-00081.bin", "model.layers.55.self_attn.o_proj.weight": "pytorch_model-00055-of-00081.bin", "model.layers.55.mlp.gate_proj.weight": "pytorch_model-00055-of-00081.bin", "model.layers.55.mlp.down_proj.weight": "pytorch_model-00055-of-00081.bin", "model.layers.55.mlp.up_proj.weight": "pytorch_model-00055-of-00081.bin", "model.layers.55.self_attn.rotary_emb.inv_freq": "pytorch_model-00055-of-00081.bin", "model.layers.56.input_layernorm.weight": "pytorch_model-00056-of-00081.bin", "model.layers.56.post_attention_layernorm.weight": "pytorch_model-00056-of-00081.bin", "model.layers.56.self_attn.q_proj.weight": "pytorch_model-00056-of-00081.bin", "model.layers.56.self_attn.k_proj.weight": "pytorch_model-00056-of-00081.bin", "model.layers.56.self_attn.v_proj.weight": "pytorch_model-00056-of-00081.bin", "model.layers.56.self_attn.o_proj.weight": "pytorch_model-00056-of-00081.bin", "model.layers.56.mlp.gate_proj.weight": "pytorch_model-00056-of-00081.bin", "model.layers.56.mlp.down_proj.weight": "pytorch_model-00056-of-00081.bin", "model.layers.56.mlp.up_proj.weight": "pytorch_model-00056-of-00081.bin", "model.layers.56.self_attn.rotary_emb.inv_freq": "pytorch_model-00056-of-00081.bin", "model.layers.57.input_layernorm.weight": "pytorch_model-00057-of-00081.bin", "model.layers.57.post_attention_layernorm.weight": "pytorch_model-00057-of-00081.bin", "model.layers.57.self_attn.q_proj.weight": "pytorch_model-00057-of-00081.bin", "model.layers.57.self_attn.k_proj.weight": "pytorch_model-00057-of-00081.bin", "model.layers.57.self_attn.v_proj.weight": "pytorch_model-00057-of-00081.bin", "model.layers.57.self_attn.o_proj.weight": "pytorch_model-00057-of-00081.bin", "model.layers.57.mlp.gate_proj.weight": "pytorch_model-00057-of-00081.bin", "model.layers.57.mlp.down_proj.weight": "pytorch_model-00057-of-00081.bin", "model.layers.57.mlp.up_proj.weight": "pytorch_model-00057-of-00081.bin", "model.layers.57.self_attn.rotary_emb.inv_freq": "pytorch_model-00057-of-00081.bin", "model.layers.58.input_layernorm.weight": "pytorch_model-00058-of-00081.bin", "model.layers.58.post_attention_layernorm.weight": "pytorch_model-00058-of-00081.bin", "model.layers.58.self_attn.q_proj.weight": "pytorch_model-00058-of-00081.bin", "model.layers.58.self_attn.k_proj.weight": "pytorch_model-00058-of-00081.bin", "model.layers.58.self_attn.v_proj.weight": "pytorch_model-00058-of-00081.bin", "model.layers.58.self_attn.o_proj.weight": "pytorch_model-00058-of-00081.bin", "model.layers.58.mlp.gate_proj.weight": "pytorch_model-00058-of-00081.bin", "model.layers.58.mlp.down_proj.weight": "pytorch_model-00058-of-00081.bin", "model.layers.58.mlp.up_proj.weight": "pytorch_model-00058-of-00081.bin", "model.layers.58.self_attn.rotary_emb.inv_freq": "pytorch_model-00058-of-00081.bin", "model.layers.59.input_layernorm.weight": "pytorch_model-00059-of-00081.bin", "model.layers.59.post_attention_layernorm.weight": "pytorch_model-00059-of-00081.bin", "model.layers.59.self_attn.q_proj.weight": "pytorch_model-00059-of-00081.bin", "model.layers.59.self_attn.k_proj.weight": "pytorch_model-00059-of-00081.bin", "model.layers.59.self_attn.v_proj.weight": "pytorch_model-00059-of-00081.bin", "model.layers.59.self_attn.o_proj.weight": "pytorch_model-00059-of-00081.bin", "model.layers.59.mlp.gate_proj.weight": "pytorch_model-00059-of-00081.bin", "model.layers.59.mlp.down_proj.weight": "pytorch_model-00059-of-00081.bin", "model.layers.59.mlp.up_proj.weight": "pytorch_model-00059-of-00081.bin", "model.layers.59.self_attn.rotary_emb.inv_freq": "pytorch_model-00059-of-00081.bin", "model.layers.60.input_layernorm.weight": "pytorch_model-00060-of-00081.bin", "model.layers.60.post_attention_layernorm.weight": "pytorch_model-00060-of-00081.bin", "model.layers.60.self_attn.q_proj.weight": "pytorch_model-00060-of-00081.bin", "model.layers.60.self_attn.k_proj.weight": "pytorch_model-00060-of-00081.bin", "model.layers.60.self_attn.v_proj.weight": "pytorch_model-00060-of-00081.bin", "model.layers.60.self_attn.o_proj.weight": "pytorch_model-00060-of-00081.bin", "model.layers.60.mlp.gate_proj.weight": "pytorch_model-00060-of-00081.bin", "model.layers.60.mlp.down_proj.weight": "pytorch_model-00060-of-00081.bin", "model.layers.60.mlp.up_proj.weight": "pytorch_model-00060-of-00081.bin", "model.layers.60.self_attn.rotary_emb.inv_freq": "pytorch_model-00060-of-00081.bin", "model.layers.61.input_layernorm.weight": "pytorch_model-00061-of-00081.bin", "model.layers.61.post_attention_layernorm.weight": "pytorch_model-00061-of-00081.bin", "model.layers.61.self_attn.q_proj.weight": "pytorch_model-00061-of-00081.bin", "model.layers.61.self_attn.k_proj.weight": "pytorch_model-00061-of-00081.bin", "model.layers.61.self_attn.v_proj.weight": "pytorch_model-00061-of-00081.bin", "model.layers.61.self_attn.o_proj.weight": "pytorch_model-00061-of-00081.bin", "model.layers.61.mlp.gate_proj.weight": "pytorch_model-00061-of-00081.bin", "model.layers.61.mlp.down_proj.weight": "pytorch_model-00061-of-00081.bin", "model.layers.61.mlp.up_proj.weight": "pytorch_model-00061-of-00081.bin", "model.layers.61.self_attn.rotary_emb.inv_freq": "pytorch_model-00061-of-00081.bin", "model.layers.62.input_layernorm.weight": "pytorch_model-00062-of-00081.bin", "model.layers.62.post_attention_layernorm.weight": "pytorch_model-00062-of-00081.bin", "model.layers.62.self_attn.q_proj.weight": "pytorch_model-00062-of-00081.bin", "model.layers.62.self_attn.k_proj.weight": "pytorch_model-00062-of-00081.bin", "model.layers.62.self_attn.v_proj.weight": "pytorch_model-00062-of-00081.bin", "model.layers.62.self_attn.o_proj.weight": "pytorch_model-00062-of-00081.bin", "model.layers.62.mlp.gate_proj.weight": "pytorch_model-00062-of-00081.bin", "model.layers.62.mlp.down_proj.weight": "pytorch_model-00062-of-00081.bin", "model.layers.62.mlp.up_proj.weight": "pytorch_model-00062-of-00081.bin", "model.layers.62.self_attn.rotary_emb.inv_freq": "pytorch_model-00062-of-00081.bin", "model.layers.63.input_layernorm.weight": "pytorch_model-00063-of-00081.bin", "model.layers.63.post_attention_layernorm.weight": "pytorch_model-00063-of-00081.bin", "model.layers.63.self_attn.q_proj.weight": "pytorch_model-00063-of-00081.bin", "model.layers.63.self_attn.k_proj.weight": "pytorch_model-00063-of-00081.bin", "model.layers.63.self_attn.v_proj.weight": "pytorch_model-00063-of-00081.bin", "model.layers.63.self_attn.o_proj.weight": "pytorch_model-00063-of-00081.bin", "model.layers.63.mlp.gate_proj.weight": "pytorch_model-00063-of-00081.bin", "model.layers.63.mlp.down_proj.weight": "pytorch_model-00063-of-00081.bin", "model.layers.63.mlp.up_proj.weight": "pytorch_model-00063-of-00081.bin", "model.layers.63.self_attn.rotary_emb.inv_freq": "pytorch_model-00063-of-00081.bin", "model.layers.64.input_layernorm.weight": "pytorch_model-00064-of-00081.bin", "model.layers.64.post_attention_layernorm.weight": "pytorch_model-00064-of-00081.bin", "model.layers.64.self_attn.q_proj.weight": "pytorch_model-00064-of-00081.bin", "model.layers.64.self_attn.k_proj.weight": "pytorch_model-00064-of-00081.bin", "model.layers.64.self_attn.v_proj.weight": "pytorch_model-00064-of-00081.bin", "model.layers.64.self_attn.o_proj.weight": "pytorch_model-00064-of-00081.bin", "model.layers.64.mlp.gate_proj.weight": "pytorch_model-00064-of-00081.bin", "model.layers.64.mlp.down_proj.weight": "pytorch_model-00064-of-00081.bin", "model.layers.64.mlp.up_proj.weight": "pytorch_model-00064-of-00081.bin", "model.layers.64.self_attn.rotary_emb.inv_freq": "pytorch_model-00064-of-00081.bin", "model.layers.65.input_layernorm.weight": "pytorch_model-00065-of-00081.bin", "model.layers.65.post_attention_layernorm.weight": "pytorch_model-00065-of-00081.bin", "model.layers.65.self_attn.q_proj.weight": "pytorch_model-00065-of-00081.bin", "model.layers.65.self_attn.k_proj.weight": "pytorch_model-00065-of-00081.bin", "model.layers.65.self_attn.v_proj.weight": "pytorch_model-00065-of-00081.bin", "model.layers.65.self_attn.o_proj.weight": "pytorch_model-00065-of-00081.bin", "model.layers.65.mlp.gate_proj.weight": "pytorch_model-00065-of-00081.bin", "model.layers.65.mlp.down_proj.weight": "pytorch_model-00065-of-00081.bin", "model.layers.65.mlp.up_proj.weight": "pytorch_model-00065-of-00081.bin", "model.layers.65.self_attn.rotary_emb.inv_freq": "pytorch_model-00065-of-00081.bin", "model.layers.66.input_layernorm.weight": "pytorch_model-00066-of-00081.bin", "model.layers.66.post_attention_layernorm.weight": "pytorch_model-00066-of-00081.bin", "model.layers.66.self_attn.q_proj.weight": "pytorch_model-00066-of-00081.bin", "model.layers.66.self_attn.k_proj.weight": "pytorch_model-00066-of-00081.bin", "model.layers.66.self_attn.v_proj.weight": "pytorch_model-00066-of-00081.bin", "model.layers.66.self_attn.o_proj.weight": "pytorch_model-00066-of-00081.bin", "model.layers.66.mlp.gate_proj.weight": "pytorch_model-00066-of-00081.bin", "model.layers.66.mlp.down_proj.weight": "pytorch_model-00066-of-00081.bin", "model.layers.66.mlp.up_proj.weight": "pytorch_model-00066-of-00081.bin", "model.layers.66.self_attn.rotary_emb.inv_freq": "pytorch_model-00066-of-00081.bin", "model.layers.67.input_layernorm.weight": "pytorch_model-00067-of-00081.bin", "model.layers.67.post_attention_layernorm.weight": "pytorch_model-00067-of-00081.bin", "model.layers.67.self_attn.q_proj.weight": "pytorch_model-00067-of-00081.bin", "model.layers.67.self_attn.k_proj.weight": "pytorch_model-00067-of-00081.bin", "model.layers.67.self_attn.v_proj.weight": "pytorch_model-00067-of-00081.bin", "model.layers.67.self_attn.o_proj.weight": "pytorch_model-00067-of-00081.bin", "model.layers.67.mlp.gate_proj.weight": "pytorch_model-00067-of-00081.bin", "model.layers.67.mlp.down_proj.weight": "pytorch_model-00067-of-00081.bin", "model.layers.67.mlp.up_proj.weight": "pytorch_model-00067-of-00081.bin", "model.layers.67.self_attn.rotary_emb.inv_freq": "pytorch_model-00067-of-00081.bin", "model.layers.68.input_layernorm.weight": "pytorch_model-00068-of-00081.bin", "model.layers.68.post_attention_layernorm.weight": "pytorch_model-00068-of-00081.bin", "model.layers.68.self_attn.q_proj.weight": "pytorch_model-00068-of-00081.bin", "model.layers.68.self_attn.k_proj.weight": "pytorch_model-00068-of-00081.bin", "model.layers.68.self_attn.v_proj.weight": "pytorch_model-00068-of-00081.bin", "model.layers.68.self_attn.o_proj.weight": "pytorch_model-00068-of-00081.bin", "model.layers.68.mlp.gate_proj.weight": "pytorch_model-00068-of-00081.bin", "model.layers.68.mlp.down_proj.weight": "pytorch_model-00068-of-00081.bin", "model.layers.68.mlp.up_proj.weight": "pytorch_model-00068-of-00081.bin", "model.layers.68.self_attn.rotary_emb.inv_freq": "pytorch_model-00068-of-00081.bin", "model.layers.69.input_layernorm.weight": "pytorch_model-00069-of-00081.bin", "model.layers.69.post_attention_layernorm.weight": "pytorch_model-00069-of-00081.bin", "model.layers.69.self_attn.q_proj.weight": "pytorch_model-00069-of-00081.bin", "model.layers.69.self_attn.k_proj.weight": "pytorch_model-00069-of-00081.bin", "model.layers.69.self_attn.v_proj.weight": "pytorch_model-00069-of-00081.bin", "model.layers.69.self_attn.o_proj.weight": "pytorch_model-00069-of-00081.bin", "model.layers.69.mlp.gate_proj.weight": "pytorch_model-00069-of-00081.bin", "model.layers.69.mlp.down_proj.weight": "pytorch_model-00069-of-00081.bin", "model.layers.69.mlp.up_proj.weight": "pytorch_model-00069-of-00081.bin", "model.layers.69.self_attn.rotary_emb.inv_freq": "pytorch_model-00069-of-00081.bin", "model.layers.70.input_layernorm.weight": "pytorch_model-00070-of-00081.bin", "model.layers.70.post_attention_layernorm.weight": "pytorch_model-00070-of-00081.bin", "model.layers.70.self_attn.q_proj.weight": "pytorch_model-00070-of-00081.bin", "model.layers.70.self_attn.k_proj.weight": "pytorch_model-00070-of-00081.bin", "model.layers.70.self_attn.v_proj.weight": "pytorch_model-00070-of-00081.bin", "model.layers.70.self_attn.o_proj.weight": "pytorch_model-00070-of-00081.bin", "model.layers.70.mlp.gate_proj.weight": "pytorch_model-00070-of-00081.bin", "model.layers.70.mlp.down_proj.weight": "pytorch_model-00070-of-00081.bin", "model.layers.70.mlp.up_proj.weight": "pytorch_model-00070-of-00081.bin", "model.layers.70.self_attn.rotary_emb.inv_freq": "pytorch_model-00070-of-00081.bin", "model.layers.71.input_layernorm.weight": "pytorch_model-00071-of-00081.bin", "model.layers.71.post_attention_layernorm.weight": "pytorch_model-00071-of-00081.bin", "model.layers.71.self_attn.q_proj.weight": "pytorch_model-00071-of-00081.bin", "model.layers.71.self_attn.k_proj.weight": "pytorch_model-00071-of-00081.bin", "model.layers.71.self_attn.v_proj.weight": "pytorch_model-00071-of-00081.bin", "model.layers.71.self_attn.o_proj.weight": "pytorch_model-00071-of-00081.bin", "model.layers.71.mlp.gate_proj.weight": "pytorch_model-00071-of-00081.bin", "model.layers.71.mlp.down_proj.weight": "pytorch_model-00071-of-00081.bin", "model.layers.71.mlp.up_proj.weight": "pytorch_model-00071-of-00081.bin", "model.layers.71.self_attn.rotary_emb.inv_freq": "pytorch_model-00071-of-00081.bin", "model.layers.72.input_layernorm.weight": "pytorch_model-00072-of-00081.bin", "model.layers.72.post_attention_layernorm.weight": "pytorch_model-00072-of-00081.bin", "model.layers.72.self_attn.q_proj.weight": "pytorch_model-00072-of-00081.bin", "model.layers.72.self_attn.k_proj.weight": "pytorch_model-00072-of-00081.bin", "model.layers.72.self_attn.v_proj.weight": "pytorch_model-00072-of-00081.bin", "model.layers.72.self_attn.o_proj.weight": "pytorch_model-00072-of-00081.bin", "model.layers.72.mlp.gate_proj.weight": "pytorch_model-00072-of-00081.bin", "model.layers.72.mlp.down_proj.weight": "pytorch_model-00072-of-00081.bin", "model.layers.72.mlp.up_proj.weight": "pytorch_model-00072-of-00081.bin", "model.layers.72.self_attn.rotary_emb.inv_freq": "pytorch_model-00072-of-00081.bin", "model.layers.73.input_layernorm.weight": "pytorch_model-00073-of-00081.bin", "model.layers.73.post_attention_layernorm.weight": "pytorch_model-00073-of-00081.bin", "model.layers.73.self_attn.q_proj.weight": "pytorch_model-00073-of-00081.bin", "model.layers.73.self_attn.k_proj.weight": "pytorch_model-00073-of-00081.bin", "model.layers.73.self_attn.v_proj.weight": "pytorch_model-00073-of-00081.bin", "model.layers.73.self_attn.o_proj.weight": "pytorch_model-00073-of-00081.bin", "model.layers.73.mlp.gate_proj.weight": "pytorch_model-00073-of-00081.bin", "model.layers.73.mlp.down_proj.weight": "pytorch_model-00073-of-00081.bin", "model.layers.73.mlp.up_proj.weight": "pytorch_model-00073-of-00081.bin", "model.layers.73.self_attn.rotary_emb.inv_freq": "pytorch_model-00073-of-00081.bin", "model.layers.74.input_layernorm.weight": "pytorch_model-00074-of-00081.bin", "model.layers.74.post_attention_layernorm.weight": "pytorch_model-00074-of-00081.bin", "model.layers.74.self_attn.q_proj.weight": "pytorch_model-00074-of-00081.bin", "model.layers.74.self_attn.k_proj.weight": "pytorch_model-00074-of-00081.bin", "model.layers.74.self_attn.v_proj.weight": "pytorch_model-00074-of-00081.bin", "model.layers.74.self_attn.o_proj.weight": "pytorch_model-00074-of-00081.bin", "model.layers.74.mlp.gate_proj.weight": "pytorch_model-00074-of-00081.bin", "model.layers.74.mlp.down_proj.weight": "pytorch_model-00074-of-00081.bin", "model.layers.74.mlp.up_proj.weight": "pytorch_model-00074-of-00081.bin", "model.layers.74.self_attn.rotary_emb.inv_freq": "pytorch_model-00074-of-00081.bin", "model.layers.75.input_layernorm.weight": "pytorch_model-00075-of-00081.bin", "model.layers.75.post_attention_layernorm.weight": "pytorch_model-00075-of-00081.bin", "model.layers.75.self_attn.q_proj.weight": "pytorch_model-00075-of-00081.bin", "model.layers.75.self_attn.k_proj.weight": "pytorch_model-00075-of-00081.bin", "model.layers.75.self_attn.v_proj.weight": "pytorch_model-00075-of-00081.bin", "model.layers.75.self_attn.o_proj.weight": "pytorch_model-00075-of-00081.bin", "model.layers.75.mlp.gate_proj.weight": "pytorch_model-00075-of-00081.bin", "model.layers.75.mlp.down_proj.weight": "pytorch_model-00075-of-00081.bin", "model.layers.75.mlp.up_proj.weight": "pytorch_model-00075-of-00081.bin", "model.layers.75.self_attn.rotary_emb.inv_freq": "pytorch_model-00075-of-00081.bin", "model.layers.76.input_layernorm.weight": "pytorch_model-00076-of-00081.bin", "model.layers.76.post_attention_layernorm.weight": "pytorch_model-00076-of-00081.bin", "model.layers.76.self_attn.q_proj.weight": "pytorch_model-00076-of-00081.bin", "model.layers.76.self_attn.k_proj.weight": "pytorch_model-00076-of-00081.bin", "model.layers.76.self_attn.v_proj.weight": "pytorch_model-00076-of-00081.bin", "model.layers.76.self_attn.o_proj.weight": "pytorch_model-00076-of-00081.bin", "model.layers.76.mlp.gate_proj.weight": "pytorch_model-00076-of-00081.bin", "model.layers.76.mlp.down_proj.weight": "pytorch_model-00076-of-00081.bin", "model.layers.76.mlp.up_proj.weight": "pytorch_model-00076-of-00081.bin", "model.layers.76.self_attn.rotary_emb.inv_freq": "pytorch_model-00076-of-00081.bin", "model.layers.77.input_layernorm.weight": "pytorch_model-00077-of-00081.bin", "model.layers.77.post_attention_layernorm.weight": "pytorch_model-00077-of-00081.bin", "model.layers.77.self_attn.q_proj.weight": "pytorch_model-00077-of-00081.bin", "model.layers.77.self_attn.k_proj.weight": "pytorch_model-00077-of-00081.bin", "model.layers.77.self_attn.v_proj.weight": "pytorch_model-00077-of-00081.bin", "model.layers.77.self_attn.o_proj.weight": "pytorch_model-00077-of-00081.bin", "model.layers.77.mlp.gate_proj.weight": "pytorch_model-00077-of-00081.bin", "model.layers.77.mlp.down_proj.weight": "pytorch_model-00077-of-00081.bin", "model.layers.77.mlp.up_proj.weight": "pytorch_model-00077-of-00081.bin", "model.layers.77.self_attn.rotary_emb.inv_freq": "pytorch_model-00077-of-00081.bin", "model.layers.78.input_layernorm.weight": "pytorch_model-00078-of-00081.bin", "model.layers.78.post_attention_layernorm.weight": "pytorch_model-00078-of-00081.bin", "model.layers.78.self_attn.q_proj.weight": "pytorch_model-00078-of-00081.bin", "model.layers.78.self_attn.k_proj.weight": "pytorch_model-00078-of-00081.bin", "model.layers.78.self_attn.v_proj.weight": "pytorch_model-00078-of-00081.bin", "model.layers.78.self_attn.o_proj.weight": "pytorch_model-00078-of-00081.bin", "model.layers.78.mlp.gate_proj.weight": "pytorch_model-00078-of-00081.bin", "model.layers.78.mlp.down_proj.weight": "pytorch_model-00078-of-00081.bin", "model.layers.78.mlp.up_proj.weight": "pytorch_model-00078-of-00081.bin", "model.layers.78.self_attn.rotary_emb.inv_freq": "pytorch_model-00078-of-00081.bin", "model.layers.79.input_layernorm.weight": "pytorch_model-00079-of-00081.bin", "model.layers.79.post_attention_layernorm.weight": "pytorch_model-00079-of-00081.bin", "model.layers.79.self_attn.q_proj.weight": "pytorch_model-00079-of-00081.bin", "model.layers.79.self_attn.k_proj.weight": "pytorch_model-00079-of-00081.bin", "model.layers.79.self_attn.v_proj.weight": "pytorch_model-00079-of-00081.bin", "model.layers.79.self_attn.o_proj.weight": "pytorch_model-00079-of-00081.bin", "model.layers.79.mlp.gate_proj.weight": "pytorch_model-00079-of-00081.bin", "model.layers.79.mlp.down_proj.weight": "pytorch_model-00079-of-00081.bin", "model.layers.79.mlp.up_proj.weight": "pytorch_model-00079-of-00081.bin", "model.layers.79.self_attn.rotary_emb.inv_freq": "pytorch_model-00079-of-00081.bin", "model.norm.weight": "pytorch_model-00080-of-00081.bin", "model.embed_tokens.weight": "pytorch_model-00080-of-00081.bin", "lm_head.weight": "pytorch_model-00080-of-00081.bin"}, "metadata": {"total_size": 130571331584}} \ No newline at end of file