nm-research committed
Commit 140b8be · verified · 1 Parent(s): 4b6f87b

Upload folder using huggingface_hub

config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
+  "_name_or_path": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
   "architectures": [
     "Qwen2ForCausalLM"
   ],
@@ -9,12 +9,12 @@
   "hidden_act": "silu",
   "hidden_size": 5120,
   "initializer_range": 0.02,
-  "intermediate_size": 13824,
+  "intermediate_size": 27648,
   "max_position_embeddings": 131072,
-  "max_window_layers": 48,
+  "max_window_layers": 64,
   "model_type": "qwen2",
   "num_attention_heads": 40,
-  "num_hidden_layers": 48,
+  "num_hidden_layers": 64,
   "num_key_value_heads": 8,
   "quantization_config": {
     "config_groups": {
@@ -50,7 +50,7 @@
       }
     },
     "format": "float-quantized",
-    "global_compression_ratio": 1.531585969025769,
+    "global_compression_ratio": 1.533275278369312,
     "ignore": [
       "lm_head"
     ],
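For reference, a minimal sketch (assuming config.json from this commit has been downloaded into the working directory) that loads the file and prints the fields touched by the change from the 14B to the 32B base model; the use of .get() for the quantization fields is a hedge, since only the diff context above is known here:

import json

# Assumption: config.json from this repository sits in the current directory.
with open("config.json") as f:
    config = json.load(f)

# Top-level fields changed by this commit (14B -> 32B base model).
for key in ("_name_or_path", "intermediate_size", "max_window_layers", "num_hidden_layers"):
    print(f"{key}: {config.get(key)}")

# "format" and "global_compression_ratio" appear in the quantization section of the diff.
qc = config.get("quantization_config", {})
print("format:", qc.get("format"))
print("global_compression_ratio:", qc.get("global_compression_ratio"))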
model-00001-of-00007.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fd8ff997ac8f8599761f6297e9f172a292805788909b8dcc6cc376f8cfc33b4c
+size 4997762744

model-00002-of-00007.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b6ac42fc7f546f2d45c983dffc5a34d542a6be7ee7673b54bfdd4c12202402c6
+size 4914421680

model-00003-of-00007.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:294b3d86ffc0fe422297c770beeb7669aeb74d7050b70d1d3d71929fe38179a2
+size 4877702248

model-00004-of-00007.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:408d2458e103566b1c848c3226505db8acffb5096e2435c65ff8dc95f5aef6a2
+size 4877702248

model-00005-of-00007.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5c8fe5fc6dd376bc078bba9d190fdf31f53a920e58e0b93accba9acbffb7ec75
+size 4877702248

model-00006-of-00007.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfe313a001266604ca15c4782c30c71f82e3312dae1034bcec7cc4623d9ef2ab
+size 4877702248

model-00007-of-00007.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8e4bef730ddab35c068267cf78fd7f385bbe480528d2d485e87a9efba7a4e92a
+size 4908583200
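The shard entries above are Git LFS pointer files: each records only the SHA-256 (oid) and byte size of the actual weights. A minimal sketch, assuming the first shard has already been fetched (via git-lfs or hf_hub_download) into the working directory, that checks the local file against the oid and size from its pointer:

import hashlib
import os

# Assumption: the shard was downloaded next to this script under its original name.
path = "model-00001-of-00007.safetensors"
expected_oid = "fd8ff997ac8f8599761f6297e9f172a292805788909b8dcc6cc376f8cfc33b4c"
expected_size = 4997762744

sha = hashlib.sha256()
with open(path, "rb") as f:
    # Hash in 1 MiB chunks so the ~5 GB shard never has to fit in memory.
    for chunk in iter(lambda: f.read(1024 * 1024), b""):
        sha.update(chunk)

assert os.path.getsize(path) == expected_size, "size mismatch"
assert sha.hexdigest() == expected_oid, "sha256 mismatch"
print("shard matches its LFS pointer")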
model.safetensors.index.json CHANGED
The diff for this file is too large to render. See raw diff
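model.safetensors.index.json maps each tensor name to the shard that stores it. Assuming the standard Hugging Face sharded-checkpoint layout ("metadata" plus "weight_map"), a short sketch that summarizes how the tensors are distributed across the seven shards added above:

import json
from collections import Counter

# Assumption: the index file follows the usual layout with a "weight_map"
# of tensor name -> shard filename and a "metadata.total_size" entry.
with open("model.safetensors.index.json") as f:
    index = json.load(f)

per_shard = Counter(index["weight_map"].values())
for shard, count in sorted(per_shard.items()):
    print(f"{shard}: {count} tensors")
print("total_size:", index.get("metadata", {}).get("total_size"))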