deepseek-v4-mini-1B-from-flash / frozen_keys.json
kshitijthakkar's picture
Partial slice from deepseek-ai/DeepSeek-V4-Flash (16/27 shards)
0073e98 verified
[
"layers.0.hc_attn_base",
"layers.0.hc_attn_scale",
"layers.0.hc_ffn_base",
"layers.0.hc_ffn_scale",
"layers.1.hc_attn_base",
"layers.1.hc_attn_scale",
"layers.1.hc_ffn_base",
"layers.1.hc_ffn_scale",
"layers.2.hc_attn_base",
"layers.2.hc_attn_scale",
"layers.2.hc_ffn_base",
"layers.2.hc_ffn_scale",
"layers.3.hc_attn_base",
"layers.3.hc_attn_scale",
"layers.3.hc_ffn_base",
"layers.3.hc_ffn_scale",
"layers.4.hc_attn_base",
"layers.4.hc_attn_scale",
"layers.4.hc_ffn_base",
"layers.4.hc_ffn_scale",
"layers.5.hc_attn_base",
"layers.5.hc_attn_scale",
"layers.5.hc_ffn_base",
"layers.5.hc_ffn_scale",
"layers.6.hc_attn_base",
"layers.6.hc_attn_scale",
"layers.6.hc_ffn_base",
"layers.6.hc_ffn_scale",
"layers.7.hc_attn_base",
"layers.7.hc_attn_scale",
"layers.7.hc_ffn_base",
"layers.7.hc_ffn_scale",
"layers.8.hc_attn_base",
"layers.8.hc_attn_scale",
"layers.8.hc_ffn_base",
"layers.8.hc_ffn_scale",
"layers.9.hc_attn_base",
"layers.9.hc_attn_scale",
"layers.9.hc_ffn_base",
"layers.9.hc_ffn_scale",
"layers.10.hc_attn_base",
"layers.10.hc_attn_scale",
"layers.10.hc_ffn_base",
"layers.10.hc_ffn_scale",
"layers.11.hc_attn_base",
"layers.11.hc_attn_scale",
"layers.11.hc_ffn_base",
"layers.11.hc_ffn_scale",
"layers.12.hc_attn_base",
"layers.12.hc_attn_scale",
"layers.12.hc_ffn_base",
"layers.12.hc_ffn_scale",
"layers.13.hc_attn_base",
"layers.13.hc_attn_scale",
"layers.13.hc_ffn_base",
"layers.13.hc_ffn_scale",
"layers.14.hc_attn_base",
"layers.14.hc_attn_scale",
"layers.14.hc_ffn_base",
"layers.14.hc_ffn_scale"
]