Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/4/rnd_search/comb_2/init/lm_head/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.12.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.12.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.12.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.12.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.12.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.12.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.13.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.13.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.13.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.13.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.13.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.13.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.14.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.14.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.14.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.14.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.14.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.14.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.15.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.15.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.15.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.15.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.15.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.15.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_2/init/model.layers.16.mlp.fc1/_s.pt +3 -0
params/phi/4/rnd_search/comb_2/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d4c4126615662a10ad18a6f91116d844af6c80ccd760919acc20e85baea28d6
|
3 |
+
size 205955
|
params/phi/4/rnd_search/comb_2/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4de17ea97aa5610de68a8acea84e95e15f68474be5113a053590b16ceea710f
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_2/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fa59e009baad97f83eb5dc7936da7d9cbfbab3deec26b4a23eaf90f581c7c1c
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c4aca3dbaa8683cae23c89ba678421974be573609563f5efeb997a42559f3c9
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:325f1efc3bd61494f24fcc3e20d62fa8d235358afa07937cffe751d85b433eb0
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:342ba12fe34030959afa0b2fcf007445a25b276c1ae770acba9d743ca5f3dd67
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df95240568cbb5d45dfba50f5510cc13f2db2711b1846463558c38b628fb2f4b
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fce452c7e8c91d3cc8de2efbfe0767e26035eb97543a810b15fb4a95d62b3fe9
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_2/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bb03a58f38c617bac5475d8659f699a8113e801db8cad0637caf147c4ac8867
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2858786f5d602f6c7aaeeb48bf5866ca6e58968378bed41bd5a07c7565cd76f
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcb79e6bc1e0569653a9c830439bebd83b58dd2c89bf3f400610d4305c1b6f55
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6462385258bbf7f051bf10c7b2c5f4113c1bce913b6d8dad66c843f948bab974
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8ca527099b1db2f9e1e687cd4f0e749f8145918df1da569e451f893a531370e
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a77e02d48a77d964a4863674b35c0d8344e604118e5269e3dfd39beda892c25e
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_2/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ca90e9010b6f403f80561dcaf0b20690338ac896cc8a0861b37628bfa2468b7
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8c5d8fdce79af3159517121e77efe5f99f0449ce06dec06118e310f330747df
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:766119cd6ed661ae763da26cff2f7ce9941b3a24da7c75a8045226719bd41905
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4aa5fca52e16fcbbf7274bc1b8c2437fb419a5145f848375c59d440b25324b14
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4ad113732576faec0f33e6570ce56073a8fc76e27ae47fc443219d95bce2e22
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb6811a5d04a546518cf9965ac35b49d39c325f3de80481ba4230c90e93cbec1
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_2/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9c51a7ce96b8f989696d04bf04835bbf4656c4c52c7ef304bab7e7f6513b1eb
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e87bd40befac73a31c22476cbc1693f10fb6c80178676ce31e1123ae6d222a13
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b468ea9ae9f5669d8ca62868c794d7c849c15e08105cac5b27ab8837e4f3e890
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8768a9643513f5163894a2cc37ea176090820165bb8542ffdab5ceaf9c4a03f8
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cbbde64a979c0e2962d48ece2efd33e01d286174263f4ae14a51a5a3fed4924
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.12.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcb521f646d66cd360c2f62b30326c0d6771e30b532f886d76295b101696cac8
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_2/init/model.layers.12.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4f70627e708dd2ace7e58c937e62a21c92ba7b24822c59b6917ad3a0b09e9eb
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.12.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6aa1591a2e93e47e6a9a88d9c6b5d4a34f2b06f215098cbe90de2f40f4ca7dad
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.12.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:712a9373cba63274435fba0ec1bbf6cda213a6b56ea7aa149dea9db01f7f2d5d
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.12.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3427aa724100af5b070f31601de62b9c657c8ac655da270a7f9928a66817ea0
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.12.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bc291e7f89f19a711f5a2bea8b281db645423cfe05623eb36583547c4bff822
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.13.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdf1e41829250c4e9a286ce7c583c3c5909a5271c9ac98b6c882933d6d682783
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_2/init/model.layers.13.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6aa3c0234cd710033371d8b80b5ee67a456c8167c43fd54438951ab002324d5c
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.13.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92d6c3d79d4579fe08cf9cadc557fcb57df3b2ca8000aa3cc37c8d29dfb0bdb9
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.13.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c833b268afceaa2fdbab236f04d131f867604f6d85c7928ed3e1b1c227803e77
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.13.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4caaf0516627f400d68682701707919ba56f719fb68091456e5d42fba780dc14
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.13.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:675c30e9669abeac448fee92d469ba315b73f4d458009a166c59d7647517235d
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.14.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa1faa9a72b76f2f24c331c3f446221e8aaa6cdfd024b1b3803d9ad75e686fb4
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_2/init/model.layers.14.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2503ee3406478d3da653794408073a63f42f3edcd2b7885491f8ddac655e1f68
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.14.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5094182c47f7f6a5f9de152354390d5fa4b1a6b665c4c79b3fab57787606b1b
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.14.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d1ed9579047623326609b4535936645505f4714b395d5b5e523621cd8b109a6
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.14.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c3d5b91c54838b5d14e70e22fb0a456b72c34274378332d563f86368221d87d
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.14.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce4ce7af499040d842c79c7c590c21630555eec2bf7b7286d96d81ec7a43863a
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.15.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f84fcbfc93a7c9aa1e87ac6eaea3d2ced8e981c94843c712108102895b24884
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_2/init/model.layers.15.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e0da0b0a586f40e1551a52cd33cdfba46b9351dda20b9defafb78e8cbe6234e
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.15.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb75e32bb26a31bfc4c5cd83893c1ea58e6c2395b7765affbf0678587b2bc04f
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.15.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:996b785566ca56794a69a301824d00cc640dc1e6d3f83eb71bb9b7e63862241d
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.15.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4945924601239eac91e5726a9609f3ac2b1a95e89bbdbd459653b34e3143b79a
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.15.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d23b95b7acf41e4c4b1da0d50096681657d0aaa9dac823852aa900ba444a3c7
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_2/init/model.layers.16.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20cf4a5e8275bab8000a5b85fe35ff23f27584a2812ccb6ed401fe87a7f4b826
|
3 |
+
size 42115
|