rwkv7-168M-pile / config.json
ZhangRC's picture
Update config.json
60d1501 verified
raw
history blame contribute delete
964 Bytes
{
"_attn_implementation_autoset": true,
"a_low_rank_dim": 64,
"architectures": [
"RWKV7ForCausalLM"
],
"attn": null,
"attn_mode": "chunk",
"auto_map": {
"AutoConfig": "modeling_rwkv7.RWKV7Config",
"AutoModel": "modeling_rwkv7.RWKV7Model",
"AutoModelForCausalLM": "modeling_rwkv7.RWKV7ForCausalLM"
},
"bos_token_id": 0,
"decay_low_rank_dim": 64,
"eos_token_id": 0,
"fuse_cross_entropy": true,
"fuse_norm": true,
"gate_low_rank_dim": 128,
"head_dim": 64,
"hidden_act": "sqrelu",
"hidden_ratio": 4.0,
"hidden_size": 768,
"initializer_range": 0.02,
"intermediate_size": 3072,
"max_position_embeddings": 2048,
"model_type": "rwkv7",
"norm_bias": true,
"norm_eps": 1e-05,
"norm_first": true,
"num_heads": null,
"num_hidden_layers": 12,
"tie_word_embeddings": false,
"torch_dtype": "double",
"transformers_version": "4.48.0",
"use_cache": true,
"v_low_rank_dim": 32,
"vocab_size": 50304
}