Update modeling_densebackward_olmoe0125.py
Browse files
modeling_densebackward_olmoe0125.py
CHANGED
@@ -183,13 +183,6 @@ class DenseBackwardOLMoEForCausalLM(OlmoeForCausalLM):
|
|
183 |
new_block.norm_topk_prob = orig_block.norm_topk_prob
|
184 |
layer.mlp = new_block
|
185 |
print(type(layer.mlp))
|
186 |
-
# 在调用post_init()前
|
187 |
-
test_param = self.model.layers[0].mlp.experts[0].up_proj.weight.data[0, 0].item()
|
188 |
-
print(f"权重示例值(前): {test_param}")
|
189 |
-
self.post_init()
|
190 |
-
# 在调用post_init()后
|
191 |
-
test_param_after = self.model.layers[0].mlp.experts[0].up_proj.weight.data[0, 0].item()
|
192 |
-
print(f"权重示例值(后): {test_param_after}")
|
193 |
|
194 |
def main():
|
195 |
config = DenseBackwardOLMoEConfig( # 官方模型参数
|
|
|
183 |
new_block.norm_topk_prob = orig_block.norm_topk_prob
|
184 |
layer.mlp = new_block
|
185 |
print(type(layer.mlp))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
186 |
|
187 |
def main():
|
188 |
config = DenseBackwardOLMoEConfig( # 官方模型参数
|