{
  "activation_hidden_dim": 384,
  "architectures": [
    "PicoDecoderHF"
  ],
  "attention_n_heads": 12,
  "attention_n_kv_heads": 4,
  "auto_map": {
    "AutoConfig": "pico_decoder.PicoDecoderHFConfig",
    "AutoModelForCausalLM": "pico_decoder.PicoDecoderHF"
  },
  "batch_size": 1024,
  "d_model": 96,
  "max_seq_len": 2048,
  "model_type": "pico_decoder",
  "n_layers": 12,
  "norm_eps": 1e-06,
  "position_emb_theta": 10000.0,
  "torch_dtype": "float32",
  "transformers_version": "4.48.1",
  "vocab_size": 50304
}