Update generate.py
Browse files
- generate.py +3 -3
generate.py
CHANGED
@@ -130,8 +130,8 @@ def generate(
|
|
130 |
forced_eos_token_id= False,
|
131 |
remove_invalid_values=None,
|
132 |
synced_gpus=None,
|
133 |
-
n_ahead=
|
134 |
-
n_ahead_talk=
|
135 |
merged_talk_heads=True,
|
136 |
merged_lm_and_talk_heads=False,
|
137 |
merged_lm_and_think_heads=True,
|
@@ -161,7 +161,7 @@ def generate(
|
|
161 |
self.use_end_thought_token = True
|
162 |
self.use_start_thought_token = True
|
163 |
self.n_ahead = n_ahead
|
164 |
-
self.n_passes =
|
165 |
self.eval_mode = True
|
166 |
self.first_run = False
|
167 |
self.rm_initialized = True
|
|
|
130 |
forced_eos_token_id= False,
|
131 |
remove_invalid_values=None,
|
132 |
synced_gpus=None,
|
133 |
+
n_ahead=12,
|
134 |
+
n_ahead_talk=4,
|
135 |
merged_talk_heads=True,
|
136 |
merged_lm_and_talk_heads=False,
|
137 |
merged_lm_and_think_heads=True,
|
|
|
161 |
self.use_end_thought_token = True
|
162 |
self.use_start_thought_token = True
|
163 |
self.n_ahead = n_ahead
|
164 |
+
self.n_passes = 2
|
165 |
self.eval_mode = True
|
166 |
self.first_run = False
|
167 |
self.rm_initialized = True
|