cpt core 4
Browse files
scripts/cpt_core_model_4.py
CHANGED
@@ -29,10 +29,12 @@ print(f'{model=}')
|
|
29 |
model = FastLanguageModel.get_peft_model(
|
30 |
model,
|
31 |
r = 256, # Choose any number > 0 ! Suggested 8, 16, 32, 64, 128
|
32 |
-
target_modules = [
|
33 |
-
|
34 |
-
|
35 |
-
|
|
|
|
|
36 |
lora_alpha = 32,
|
37 |
lora_dropout = 0, # Supports any, but = 0 is optimized
|
38 |
bias = "none", # Supports any, but = "none" is optimized
|
|
|
29 |
model = FastLanguageModel.get_peft_model(
|
30 |
model,
|
31 |
r = 256, # Choose any number > 0 ! Suggested 8, 16, 32, 64, 128
|
32 |
+
target_modules = [
|
33 |
+
"q_proj", "k_proj", "v_proj", "o_proj",
|
34 |
+
"gate_proj",
|
35 |
+
"up_proj", "down_proj",
|
36 |
+
"embed_tokens", "lm_head",
|
37 |
+
],
|
38 |
lora_alpha = 32,
|
39 |
lora_dropout = 0, # Supports any, but = 0 is optimized
|
40 |
bias = "none", # Supports any, but = "none" is optimized
|