qgallouedec HF Staff committed on
Commit
82a8da7
·
1 Parent(s): 4d346dc
configs/Qwen3-4B-Base_a10g-small.yaml CHANGED
@@ -1,5 +1,5 @@
1
  # Model arguments
2
- model_name_or_path: Qwen/Qwen2.5-0.5B
3
  model_revision: main
4
  torch_dtype: bfloat16
5
  attn_implementation: flash_attention_2
 
1
  # Model arguments
2
+ model_name_or_path: Qwen/Qwen2.5-1.5B
3
  model_revision: main
4
  torch_dtype: bfloat16
5
  attn_implementation: flash_attention_2