Update configuration_quiet.py
Browse files
- configuration_quiet.py (+2 -0)
configuration_quiet.py
CHANGED
|
@@ -114,6 +114,7 @@ class QuietConfig(PretrainedConfig):
|
|
| 114 |
sliding_window=4096,
|
| 115 |
attention_dropout=0.0,
|
| 116 |
max_thoughts=16,
|
|
|
|
| 117 |
merged_talk_heads=True,
|
| 118 |
merged_lm_and_talk_heads=False,
|
| 119 |
merged_lm_and_think_heads=True,
|
|
@@ -146,6 +147,7 @@ class QuietConfig(PretrainedConfig):
|
|
| 146 |
self.rope_theta = rope_theta
|
| 147 |
self.attention_dropout = attention_dropout
|
| 148 |
self.max_thoughts = max_thoughts
|
|
|
|
| 149 |
self.merged_talk_heads = merged_talk_heads
|
| 150 |
self.merged_lm_and_talk_heads = merged_lm_and_talk_heads
|
| 151 |
self.merged_lm_and_think_heads = merged_lm_and_think_heads
|
|
|
|
| 114 |
sliding_window=4096,
|
| 115 |
attention_dropout=0.0,
|
| 116 |
max_thoughts=16,
|
| 117 |
+ max_temperature=1,
|
| 118 |
merged_talk_heads=True,
|
| 119 |
merged_lm_and_talk_heads=False,
|
| 120 |
merged_lm_and_think_heads=True,
|
|
|
|
| 147 |
self.rope_theta = rope_theta
|
| 148 |
self.attention_dropout = attention_dropout
|
| 149 |
self.max_thoughts = max_thoughts
|
| 150 |
+ self.max_temperature = max_temperature
|
| 151 |
self.merged_talk_heads = merged_talk_heads
|
| 152 |
self.merged_lm_and_talk_heads = merged_lm_and_talk_heads
|
| 153 |
self.merged_lm_and_think_heads = merged_lm_and_think_heads
|