Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/4/rnd_search/comb_16/init/lm_head/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/lm_head/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/4/rnd_search/comb_16/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8081136000b352fef582081fa6d34d148cb798dfd4c35b4c3c8aaa65b5a92dfa
|
3 |
+
size 205955
|
params/phi/4/rnd_search/comb_16/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbe8c219a1bb4f49eaa5f9dd324ef5649693dfa9acf5f601187eda94523138e0
|
3 |
+
size 205955
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abdc1842618c11e53a56d012b6b80d7f365c13c9b4959b7f03b89e6343fc6595
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2812af787d5e16078a06d8b4b33d902559f26e67bfba1a29558fa7492bc2c57
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e79c42cc36ea357bc12f75bc1c63aea4951313262a227e11f1872c4f2ecd7242
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41bd1397b31269896be80577dab91c91bb7894921f68d27163c2fb1b6a2bc25e
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33773d4001c5e938843a716d8879657746d6b42f004064db8c3ca43c79f2e3f8
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57db23719c74a2bb5136d0ba917417164e1e73abf070ce37858481a53f0f866a
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d48f8dd53b6c3c22079f1c360a7a8eece1fa3b2135a5031d1cd724a581bd779f
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7743782d68d172e149b8b50aed5109cda1d44278fc3c648eabf57611c6143f3b
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76fc0fd9afeca7fbbe1707aaeed14fdd81d580c7bac76bc92fa4edaa3fd9afa8
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f245ea1ce77c4cafdb6bd0397c96252c055e64ea0f3440d12837bd7ce8315f4
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ddb8259ba2be66d6c5f0b9bf74761dcd86ee06410223948482994a410228049
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ac392877175da5aaa714fc666b7d80325d4506f8502e8108385ca4e83216991
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61800c9881225efe2475647e6df934497b21e5cad3bf811eeda6426bf55812c2
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb6312f871a4544c44f8609cd0b251493b082f265112915d7179b69a107a9ad1
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:291dc55a021448ec23b297005c343a2c979cf1709f0fe83c0dc68bd24ebc1e16
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0406ac1ab305e0ce50a5ecf4c11797322a4ba421126c8afc9170a16f8412b13
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb8e255b013f88eff388b1fe179388499718d037d92eb6c92a9fef8febb658df
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:081648208bce392bc7508fce676438822fdc1867d9f8d053cc7b49ab18da2384
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91f1dd3918549e320f115fecbc9d61215c4ab05a8cf8511c4c6d5eed20a840b3
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7e71b57b056a9824f056848cc89d738080869632f778356dfdf2b05f83d44b3
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af7a12a3c3ab1109e3d77e0bab6cf2f8c16cc51148766dd3cf06f91adfcb8c10
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e9b4236f5d75e8284a1cffec1eb00b3ee262e88964ce5a51555d96e529ed07f
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f77f0dfe18870f5969a50fc4661ab36f14e9dfa3e4a0b36d2a188f871808a6d1
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95271ea60c5d80f9c4338f5012954083747f1c5cd7bedb20b5ff90dc03feefe0
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76468ffa5b8689b4f148b3b4b4b708fb802b1a592e8e91473e5434bccecc901a
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5d3e66675d2ba6c43cf54db7412874864872826a7fe44fe7cdaf04442f68de1
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f700d1cc105e177ca724050a2cafcc0c004445d6d3e4cd4233ed94a6dd801eda
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:833720b521835b7ea7e93b0cc6c50f8c8af4d0b1e13c3d45fedefeac6c6222e0
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba8302e4782eac2acaec4ad56e590481c42e7f44121cedf965d5c1b7c2bfa48e
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ab44f305c5af23b4eb5a59e4a35b28342f6c7225a91c1b486e9e87f0ed31fd1
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4c5786a30f4ee4b19b6e4b10fd2ad7274278e8e6113a0040e62b0b9d0ed1f4c
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a086fc4d58b4f668d616e5547141c46cb64bf943650f5410ad036b43f225e8e
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f2066b539183f0ce242521c0179555ed57ab75ffaeec197042fee7071c78fc7
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79aefe0df4a2dfee08f1947c9932c06f0fe63886478c7725c92e346488fd9bc7
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6d1d4307d95ddb6ffcf94988c4129f4261bfde10014e9ed600c9785cf04807e
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0df23fff0254571c7851dec6fb55e931912614caef974e4ed1c498e8c024dbd
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:507eace57f9b0452538055cfc4bacaf35ad6b7744a49226bdca444a1ec3cdccd
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7716dd9f71c534e7e6ccb119ac5d28474bce95a0f766e55289fe984d660cfa4
|
3 |
+
size 42115
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21371820c5696586e209954ba94878258578f5f99271a6312f77e2be5496d337
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:befe7ae972f3855ca8ab2a8f8fff3dd6a3bc14ae3d25056d42c627d37489c636
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a6d15209a25745012238db835c72ba1a51f7fa465e9257038166a0852e2a012
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c1d75cfcde41c113260af7976cdbd83a1138746716ca4113c2502108ed47f0e
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5279fe052f339e3f63dd3de0ff3193397d692c4ef67b06f1066d4c33838b99a4
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82e35279e626b400b4fcacba18d80339639bce79483b141c274d89a8d4f76550
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95bfbae9de09af467a6152484daf90f76e256979ae4a7fe0ecbfec5ee4adce77
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4f74d57bb6bff7f3e345aec603be05a9a246394bc47ee884cd4ae2681811188
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a63fc9278d45bf212f7481fa68d5cbc21639e68f1bb644a7bf411be496c93417
|
3 |
+
size 11395
|
params/phi/4/rnd_search/comb_16/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba7661105333952946aa5983e581cdb1ddbefab4929861ad75f4eb2a755cc32d
|
3 |
+
size 11395
|