Around6827 committed on
Commit
265ea82
·
1 Parent(s): 4dd8e5b

Training in progress, epoch 1

Browse files
Files changed (4) hide show
  1. README.md +13 -0
  2. adapter_config.json +2 -2
  3. adapter_model.bin +1 -1
  4. training_args.bin +1 -1
README.md CHANGED
@@ -31,6 +31,18 @@ More information needed
31
  ## Training procedure
32
 
33
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  The following `bitsandbytes` quantization config was used during training:
35
  - quant_method: bitsandbytes
36
  - load_in_8bit: True
@@ -65,6 +77,7 @@ The following hyperparameters were used during training:
65
 
66
  ### Framework versions
67
 
 
68
  - PEFT 0.6.0.dev0
69
  - Transformers 4.34.0.dev0
70
  - Pytorch 2.0.1+cu117
 
31
  ## Training procedure
32
 
33
 
34
+ The following `bitsandbytes` quantization config was used during training:
35
+ - quant_method: bitsandbytes
36
+ - load_in_8bit: True
37
+ - load_in_4bit: False
38
+ - llm_int8_threshold: 6.0
39
+ - llm_int8_skip_modules: None
40
+ - llm_int8_enable_fp32_cpu_offload: False
41
+ - llm_int8_has_fp16_weight: False
42
+ - bnb_4bit_quant_type: fp4
43
+ - bnb_4bit_use_double_quant: False
44
+ - bnb_4bit_compute_dtype: float32
45
+
46
  The following `bitsandbytes` quantization config was used during training:
47
  - quant_method: bitsandbytes
48
  - load_in_8bit: True
 
77
 
78
  ### Framework versions
79
 
80
+ - PEFT 0.6.0.dev0
81
  - PEFT 0.6.0.dev0
82
  - Transformers 4.34.0.dev0
83
  - Pytorch 2.0.1+cu117
adapter_config.json CHANGED
@@ -17,11 +17,11 @@
17
  "revision": null,
18
  "target_modules": [
19
  "gate_proj",
 
20
  "v_proj",
 
21
  "up_proj",
22
- "down_proj",
23
  "q_proj",
24
- "k_proj",
25
  "o_proj"
26
  ],
27
  "task_type": "CAUSAL_LM"
 
17
  "revision": null,
18
  "target_modules": [
19
  "gate_proj",
20
+ "down_proj",
21
  "v_proj",
22
+ "k_proj",
23
  "up_proj",
 
24
  "q_proj",
 
25
  "o_proj"
26
  ],
27
  "task_type": "CAUSAL_LM"
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:629b8b83267e82fc04c0f4dbae0aedb7ddd0d6b922cb5c2fcc758ac96964e943
3
  size 319977229
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad4ea2397138ed2d852004167835dbb64b00ba4100354b13d396654bc6e1ce5e
3
  size 319977229
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3fbb5692d84707ba0da73df5c8db6584484c9710f3dd89c322d18f3312498cb9
3
  size 4475
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17b8a61bed456f0e64f13280369796447b5a0eb70ef6f1bbaa8ff6c0edeefe45
3
  size 4475