{ "d_model": 2048, "fused_add_norm": true, "n_layer": 48, "pad_vocab_size_multiple": 1, "residual_in_fp32": true, "rms_norm": false, "ssm_cfg": {}, "vocab_size": 100008 }