Commit
·
82a8da7
1
Parent(s):
4d346dc
1.5
Browse files
configs/Qwen3-4B-Base_a10g-small.yaml
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
# Model arguments
|
2 |
-
model_name_or_path: Qwen/Qwen2.5-
|
3 |
model_revision: main
|
4 |
torch_dtype: bfloat16
|
5 |
attn_implementation: flash_attention_2
|
|
|
1 |
# Model arguments
|
2 |
+
model_name_or_path: Qwen/Qwen2.5-1.5B
|
3 |
model_revision: main
|
4 |
torch_dtype: bfloat16
|
5 |
attn_implementation: flash_attention_2
|