Commit
·
c5d1a86
1
Parent(s):
f105b76
demo config and run trl sft
Browse files
- configs/Qwen3-4B-Base_a10g-small.yaml +2 -0
- sft.py +4 -1
configs/Qwen3-4B-Base_a10g-small.yaml
CHANGED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
model_name_or_path: Qwen/Qwen2.5-0.5B
|
2 |
+
dataset_name: stanfordnlp/imdb
|
sft.py
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
#!/usr/bin/env python3
|
2 |
-
|
3 |
import argparse
|
|
|
4 |
|
5 |
parser = argparse.ArgumentParser(description="Demo script for the model.")
|
6 |
|
@@ -9,3 +9,6 @@ parser.add_argument("--dataset", type=str)
|
|
9 |
|
10 |
args = parser.parse_args()
|
11 |
print(f"Model: {args.model}, Dataset: {args.dataset}")
|
|
|
|
|
|
|
|
1 |
#!/usr/bin/env python3
|
|
|
2 |
import argparse
|
3 |
+
import subprocess
|
4 |
|
5 |
parser = argparse.ArgumentParser(description="Demo script for the model.")
|
6 |
|
|
|
9 |
|
10 |
args = parser.parse_args()
|
11 |
print(f"Model: {args.model}, Dataset: {args.dataset}")
|
12 |
+
|
13 |
+
# Launch supervised fine-tuning through the `trl sft` CLI using the demo config
|
14 |
+
subprocess.run(["trl", "sft", "--config", "configs/Qwen3-4B-Base_a10g-small.yaml"])
|