burtenshaw
/

Qwen3-30B-A3B-python-coder

Text Generation

Generated from Trainer

Model card Files Files and versions Community

burtenshaw HF Staff committed on May 2

Commit

02a8cd1

·

verified ·

1 Parent(s): 4ecc585

Upload train.py with huggingface_hub

Files changed (1) hide show

train.py +6 -6

train.py CHANGED Viewed

@@ -71,11 +71,11 @@ learning_rate = 2e-4
 """## Load model and tokenizer"""
 # specify how to quantize the model
-quantization_config = BitsAndBytesConfig(
-        load_in_4bit=True,
-        bnb_4bit_quant_type="nf4",
-        bnb_4bit_use_double_quant=True,
-)
 # Load model
 model = AutoModelForCausalLM.from_pretrained(
@@ -83,7 +83,7 @@ model = AutoModelForCausalLM.from_pretrained(
     torch_dtype=torch.bfloat16,
     use_cache=False,  # Disable KV cache during training
     device_map="auto",
-    quantization_config=quantization_config
 )
 # Load tokenizer

 """## Load model and tokenizer"""
 # specify how to quantize the model
+# quantization_config = BitsAndBytesConfig(
+#         load_in_4bit=True,
+#         bnb_4bit_quant_type="nf4",
+#         bnb_4bit_use_double_quant=True,
+# )
 # Load model
 model = AutoModelForCausalLM.from_pretrained(
     torch_dtype=torch.bfloat16,
     use_cache=False,  # Disable KV cache during training
     device_map="auto",
+    # quantization_config=quantization_config
 )
 # Load tokenizer