at676 committed on
Commit
39ad130
·
verified ·
1 Parent(s): dc1ef53

Upload folder using huggingface_hub (#1)

Browse files

- 36a9ed17d8e99bdefb74b7f12d0ccc87c7ef2dcbe6d4a9964056f0344882f9f7 (3e4e49e5692387e6c278bc304eb856b7533f3961)
- e91fee41687cc861de58964c4e5f83296311fb1600b5dd1ac8b8a56ce1ff00a2 (3540da30d8e2ce07f3bb783623204f358e050e8a)
- 3892bfba3a9b6a2e1a8cf383a8cba4c575e71b93739e190074b5b0ccd5f178bb (3bfbd21cd57f5a3d149902f5546ffcbb2380f0bd)
- 93cd74d06c1647945c5df258d2c7289ad10df2c4e1bcf89bce3bee2f4cd6d0fa (7ec76d0602a1a7bf0ded6b7ed4737b570a7f8b76)
- cafa3c0676737cc2594130d91b0aa4925fa4dfa6ef134d958fb312329ec70479 (811e0ed715f25cc1b5e1a26d087c1126913c573b)
- 8816b9d3dd8673f0c440f84b1bc4871d03fe504e94d9cc68e9957021b00053cf (5f77302eb49edcc329b5bfa1ac8bef87a6f3ff43)
- 19325b2bd849a29641b174366b484b9a0d425da14d0a350ceac251751c7de66d (8e2e6e2606010372c5af72f5423a4c51c7cde3b9)
- 039c78c806223583a09e5ded6eda9ceab311aeab289558f32bf0ad36b949c1f3 (450a0ae1f8d37ce6cbb19bf9845a0787c97eef4a)

config.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "meta-llama/Llama-2-70b-chat-hf",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 28672,
14
+ "max_position_embeddings": 4096,
15
+ "mlp_bias": false,
16
+ "model_type": "llama",
17
+ "num_attention_heads": 64,
18
+ "num_hidden_layers": 80,
19
+ "num_key_value_heads": 8,
20
+ "pretraining_tp": 1,
21
+ "quip_params": {
22
+ "K": 4,
23
+ "L": 16,
24
+ "V": 2,
25
+ "codebook": "bitshift",
26
+ "codebook_version": 0,
27
+ "decode_mode": "quantlut_sym",
28
+ "td_x": 16,
29
+ "td_y": 16,
30
+ "tlut_bits": 9
31
+ },
32
+ "rms_norm_eps": 1e-05,
33
+ "rope_scaling": null,
34
+ "rope_theta": 10000.0,
35
+ "tie_word_embeddings": false,
36
+ "torch_dtype": "float16",
37
+ "transformers_version": "4.44.2",
38
+ "use_cache": true,
39
+ "vocab_size": 32000
40
+ }
generation_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 1,
3
+ "do_sample": true,
4
+ "eos_token_id": 2,
5
+ "max_length": 4096,
6
+ "pad_token_id": 0,
7
+ "temperature": 0.6,
8
+ "top_p": 0.9,
9
+ "transformers_version": "4.44.2"
10
+ }
model-00001-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f288b5eb8ce22c9cb074c5ffc67b64dd66b1475ea18c18c50807634a6aed0ab
3
+ size 4883545208
model-00002-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7263c31313c11e50212f2f48164cc23e65400d3b89f17bb29e4f6a15479ddccd
3
+ size 4947116832
model-00003-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbf691073bc35d9d476e4948dfa3789b33728330b65b60e31e0994df98ddacba
3
+ size 4905181440
model-00004-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:247ebd81283d85a4cbf15e1c9a01c13f12ff4e5abcab7dc3c8e8f89df58cf3d1
3
+ size 4947116832
model-00005-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05468c0bd5c37c8c7706191a458e412c437f1bd46f3b6b60226dcb740e516db5
3
+ size 4905181440
model-00006-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c254837c2cdfd8d53108f40108b09cb1fdb99ade083b65cf9aacbc1ed655d0a
3
+ size 4947116832
model-00007-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d6331adb1892870a712d1a1e494e8440f8507c0b5ff18a8f8ad73b22120e97f
3
+ size 4905181440
model-00008-of-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1988650e33be854c15399760d1aa35124592704c769c2cc6b1abdd6e875ec366
3
+ size 877016624
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff