autoprogrammer committed on
Commit
2917b63
·
verified ·
1 Parent(s): c401025

Update modeling_densebackward_olmoe0125.py

Browse files
modeling_densebackward_olmoe0125.py CHANGED
@@ -115,6 +115,12 @@ class DenseBackwardOLMoEForCausalLM(OlmoeForCausalLM):
115
  new_block.norm_topk_prob = orig_block.norm_topk_prob
116
  layer.mlp = new_block
117
  print(type(layer.mlp))
 
 
 
 
 
 
118
 
119
  def main():
120
  config = DenseBackwardOLMoEConfig( # 官方模型参数
 
115
  new_block.norm_topk_prob = orig_block.norm_topk_prob
116
  layer.mlp = new_block
117
  print(type(layer.mlp))
118
+ # 释放预训练模型内存
119
+ del pretrained_model
120
+ import gc
121
+ gc.collect()
122
+ torch.cuda.empty_cache()
123
+ print("原始预训练模型已释放")
124
 
125
  def main():
126
  config = DenseBackwardOLMoEConfig( # 官方模型参数