|
|
|
|
|
|
|
from transformers.models.olmoe.configuration_olmoe import OlmoeConfig |
|
|
|
class DenseBackwardOLMoEConfig(OlmoeConfig):
    """Configuration for the DenseBackward variant of OLMoE.

    Extends ``OlmoeConfig`` with a ``model_marker`` attribute and a
    class-specific default for ``intermediate_size``.

    Args:
        model_marker: Value stored on the instance as ``model_marker``.
        intermediate_size: Value stored on the instance as
            ``intermediate_size``. Defaults to 1024, the value this class
            previously hard-coded; an explicitly supplied value is now
            respected instead of being silently overwritten.
        **kwargs: Forwarded unchanged to ``OlmoeConfig.__init__``.
    """

    model_type = "DenseBackward_olmoe"

    # Maps Auto* class names to "module.ClassName" strings.
    # NOTE(review): presumably consumed by the Transformers remote-code
    # loading path; confirm the module names match the files shipped
    # alongside the checkpoint.
    auto_map = {
        "AutoConfig": "configuration_custom.DenseBackwardOLMoEConfig",
        "AutoModelForCausalLM": "modeling_custom.DenseBackwardOLMoEForCausalLM",
    }

    def __init__(
        self,
        model_marker: str = "DenseBackward_olmoe_marker",
        intermediate_size: int = 1024,
        **kwargs,
    ) -> None:
        super().__init__(**kwargs)
        self.model_marker = model_marker
        # Assigned after the base initializer so that this class's value
        # (1024 unless the caller overrides it) replaces whatever the base
        # initializer stored.
        self.intermediate_size = intermediate_size
|
|
|
def main():
    """Build a config with the default marker string and print it."""
    marker = "DenseBackward_olmoe_marker"
    print(DenseBackwardOLMoEConfig(model_marker=marker))
|
|
|
# Run the demo only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()