Update modeling_densebackward_olmoe0125.py
Browse files
modeling_densebackward_olmoe0125.py
CHANGED
@@ -115,6 +115,12 @@ class DenseBackwardOLMoEForCausalLM(OlmoeForCausalLM):
|
|
115 |
new_block.norm_topk_prob = orig_block.norm_topk_prob
|
116 |
layer.mlp = new_block
|
117 |
print(type(layer.mlp))
|
|
|
|
|
|
|
|
|
|
|
|
|
118 |
|
119 |
def main():
|
120 |
config = DenseBackwardOLMoEConfig( # 官方模型参数
|
|
|
115 |
new_block.norm_topk_prob = orig_block.norm_topk_prob
|
116 |
layer.mlp = new_block
|
117 |
print(type(layer.mlp))
|
118 |
+
# 释放预训练模型内存
|
119 |
+
del pretrained_model
|
120 |
+
import gc
|
121 |
+
gc.collect()
|
122 |
+
torch.cuda.empty_cache()
|
123 |
+
print("原始预训练模型已释放")
|
124 |
|
125 |
def main():
|
126 |
config = DenseBackwardOLMoEConfig( # 官方模型参数
|