Update README.md
Browse files
README.md
CHANGED
@@ -16,7 +16,9 @@ TRL supports the DPO Trainer for training language models from preference data,
|
|
16 |
target_modules=[ "gate_proj", "up_proj", "down_proj"]
|
17 |
|
18 |
```
|
19 |
-
sample
|
|
|
|
|
20 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
21 |
import math
|
22 |
|
@@ -40,4 +42,3 @@ while len(prompt) > 0:
|
|
40 |
|
41 |
```
|
42 |
|
43 |
-
```
|
|
|
16 |
target_modules=[ "gate_proj", "up_proj", "down_proj"]
|
17 |
|
18 |
```
|
19 |
+
sample code
|
20 |
+
```
|
21 |
+
import torch
|
22 |
from transformers import AutoTokenizer, AutoModelForCausalLM
|
23 |
import math
|
24 |
|
|
|
42 |
|
43 |
```
|
44 |
|
|