pico-decoder-small / config.json
rdiehlmartinez's picture
pico-decoder-small-1 trained to 100k steps
546d4d8
{
"activation_hidden_dim": 1536,
"architectures": [
"PicoDecoderHF"
],
"attention_n_heads": 12,
"attention_n_kv_heads": 4,
"auto_map": {
"AutoConfig": "pico_decoder.PicoDecoderHFConfig",
"AutoModelForCausalLM": "pico_decoder.PicoDecoderHF"
},
"batch_size": 1024,
"d_model": 384,
"max_seq_len": 2048,
"model_type": "pico_decoder",
"n_layers": 12,
"norm_eps": 1e-06,
"position_emb_theta": 10000.0,
"torch_dtype": "float32",
"transformers_version": "4.48.3",
"vocab_size": 50304
}