latest
7.9GB
4B
303 Pulls Updated 4 months ago
f7504cc57e0f · 7.9GB
-
general.architectureqwen2
-
general.file_typeF16
-
qwen2.attention.head_count20
-
qwen2.attention.head_count_kv20
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count40
-
qwen2.context_length32768
-
qwen2.embedding_length2560
-
qwen2.feed_forward_length6912
-
qwen2.rope.freq_base5e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151643
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightF16[2560 151936]
-
blk.0.attn_norm.weightF32[2560]
-
blk.0.ffn_down.weightF16[6912 2560]
-
blk.0.ffn_gate.weightF16[2560 6912]
-
blk.0.ffn_up.weightF16[2560 6912]
-
blk.0.ffn_norm.weightF32[2560]
-
blk.0.attn_k.biasF32[2560]
-
blk.0.attn_k.weightF16[2560 2560]
-
blk.0.attn_output.weightF16[2560 2560]
-
blk.0.attn_q.biasF32[2560]
-
blk.0.attn_q.weightF16[2560 2560]
-
blk.0.attn_v.biasF32[2560]
-
blk.0.attn_v.weightF16[2560 2560]
-
blk.1.attn_norm.weightF32[2560]
-
blk.1.ffn_down.weightF16[6912 2560]
-
blk.1.ffn_gate.weightF16[2560 6912]
-
blk.1.ffn_up.weightF16[2560 6912]
-
blk.1.ffn_norm.weightF32[2560]
-
blk.1.attn_k.biasF32[2560]
-
blk.1.attn_k.weightF16[2560 2560]
-
blk.1.attn_output.weightF16[2560 2560]
-
blk.1.attn_q.biasF32[2560]
-
blk.1.attn_q.weightF16[2560 2560]
-
blk.1.attn_v.biasF32[2560]
-
blk.1.attn_v.weightF16[2560 2560]
-
blk.2.attn_norm.weightF32[2560]
-
blk.2.ffn_down.weightF16[6912 2560]
-
blk.2.ffn_gate.weightF16[2560 6912]
-
blk.2.ffn_up.weightF16[2560 6912]
-
blk.2.ffn_norm.weightF32[2560]
-
blk.2.attn_k.biasF32[2560]
-
blk.2.attn_k.weightF16[2560 2560]
-
blk.2.attn_output.weightF16[2560 2560]
-
blk.2.attn_q.biasF32[2560]
-
blk.2.attn_q.weightF16[2560 2560]
-
blk.2.attn_v.biasF32[2560]
-
blk.2.attn_v.weightF16[2560 2560]
-
blk.3.attn_norm.weightF32[2560]
-
blk.3.ffn_down.weightF16[6912 2560]
-
blk.3.ffn_gate.weightF16[2560 6912]
-
blk.3.ffn_up.weightF16[2560 6912]
-
blk.3.ffn_norm.weightF32[2560]
-
blk.3.attn_k.biasF32[2560]
-
blk.3.attn_k.weightF16[2560 2560]
-
blk.3.attn_output.weightF16[2560 2560]
-
blk.3.attn_q.biasF32[2560]
-
blk.3.attn_q.weightF16[2560 2560]
-
blk.3.attn_v.biasF32[2560]
-
blk.3.attn_v.weightF16[2560 2560]
-
blk.4.attn_norm.weightF32[2560]
-
blk.4.ffn_down.weightF16[6912 2560]
-
blk.4.ffn_gate.weightF16[2560 6912]
-
blk.4.ffn_up.weightF16[2560 6912]
-
blk.4.ffn_norm.weightF32[2560]
-
blk.4.attn_k.biasF32[2560]
-
blk.4.attn_k.weightF16[2560 2560]
-
blk.4.attn_output.weightF16[2560 2560]
-
blk.4.attn_q.biasF32[2560]
-
blk.4.attn_q.weightF16[2560 2560]
-
blk.4.attn_v.biasF32[2560]
-
blk.4.attn_v.weightF16[2560 2560]
-
blk.5.attn_norm.weightF32[2560]
-
blk.5.ffn_down.weightF16[6912 2560]
-
blk.5.ffn_gate.weightF16[2560 6912]
-
blk.5.ffn_up.weightF16[2560 6912]
-
blk.5.ffn_norm.weightF32[2560]
-
blk.5.attn_k.biasF32[2560]
-
blk.5.attn_k.weightF16[2560 2560]
-
blk.5.attn_output.weightF16[2560 2560]
-
blk.5.attn_q.biasF32[2560]
-
blk.5.attn_q.weightF16[2560 2560]
-
blk.5.attn_v.biasF32[2560]
-
blk.5.attn_v.weightF16[2560 2560]
-
blk.6.attn_norm.weightF32[2560]
-
blk.6.ffn_down.weightF16[6912 2560]
-
blk.6.ffn_gate.weightF16[2560 6912]
-
blk.6.ffn_up.weightF16[2560 6912]
-
blk.6.ffn_norm.weightF32[2560]
-
blk.6.attn_k.biasF32[2560]
-
blk.6.attn_k.weightF16[2560 2560]
-
blk.6.attn_output.weightF16[2560 2560]
-
blk.6.attn_q.biasF32[2560]
-
blk.6.attn_q.weightF16[2560 2560]
-
blk.6.attn_v.biasF32[2560]
-
blk.6.attn_v.weightF16[2560 2560]
-
blk.7.attn_norm.weightF32[2560]
-
blk.7.ffn_down.weightF16[6912 2560]
-
blk.7.ffn_gate.weightF16[2560 6912]
-
blk.7.ffn_up.weightF16[2560 6912]
-
blk.7.ffn_norm.weightF32[2560]
-
blk.7.attn_k.biasF32[2560]
-
blk.7.attn_k.weightF16[2560 2560]
-
blk.7.attn_output.weightF16[2560 2560]
-
blk.7.attn_q.biasF32[2560]
-
blk.7.attn_q.weightF16[2560 2560]
-
blk.7.attn_v.biasF32[2560]
-
blk.7.attn_v.weightF16[2560 2560]
-
blk.8.attn_norm.weightF32[2560]
-
blk.8.ffn_down.weightF16[6912 2560]
-
blk.8.ffn_gate.weightF16[2560 6912]
-
blk.8.ffn_up.weightF16[2560 6912]
-
blk.8.ffn_norm.weightF32[2560]
-
blk.8.attn_k.biasF32[2560]
-
blk.8.attn_k.weightF16[2560 2560]
-
blk.8.attn_output.weightF16[2560 2560]
-
blk.8.attn_q.biasF32[2560]
-
blk.8.attn_q.weightF16[2560 2560]
-
blk.8.attn_v.biasF32[2560]
-
blk.8.attn_v.weightF16[2560 2560]
-
blk.9.attn_norm.weightF32[2560]
-
blk.9.ffn_down.weightF16[6912 2560]
-
blk.9.ffn_gate.weightF16[2560 6912]
-
blk.9.ffn_up.weightF16[2560 6912]
-
blk.9.ffn_norm.weightF32[2560]
-
blk.9.attn_k.biasF32[2560]
-
blk.9.attn_k.weightF16[2560 2560]
-
blk.9.attn_output.weightF16[2560 2560]
-
blk.9.attn_q.biasF32[2560]
-
blk.9.attn_q.weightF16[2560 2560]
-
blk.9.attn_v.biasF32[2560]
-
blk.9.attn_v.weightF16[2560 2560]
-
blk.10.attn_norm.weightF32[2560]
-
blk.10.ffn_down.weightF16[6912 2560]
-
blk.10.ffn_gate.weightF16[2560 6912]
-
blk.10.ffn_up.weightF16[2560 6912]
-
blk.10.ffn_norm.weightF32[2560]
-
blk.10.attn_k.biasF32[2560]
-
blk.10.attn_k.weightF16[2560 2560]
-
blk.10.attn_output.weightF16[2560 2560]
-
blk.10.attn_q.biasF32[2560]
-
blk.10.attn_q.weightF16[2560 2560]
-
blk.10.attn_v.biasF32[2560]
-
blk.10.attn_v.weightF16[2560 2560]
-
blk.11.attn_norm.weightF32[2560]
-
blk.11.ffn_down.weightF16[6912 2560]
-
blk.11.ffn_gate.weightF16[2560 6912]
-
blk.11.ffn_up.weightF16[2560 6912]
-
blk.11.ffn_norm.weightF32[2560]
-
blk.11.attn_k.biasF32[2560]
-
blk.11.attn_k.weightF16[2560 2560]
-
blk.11.attn_output.weightF16[2560 2560]
-
blk.11.attn_q.biasF32[2560]
-
blk.11.attn_q.weightF16[2560 2560]
-
blk.11.attn_v.biasF32[2560]
-
blk.11.attn_v.weightF16[2560 2560]
-
blk.12.attn_norm.weightF32[2560]
-
blk.12.ffn_down.weightF16[6912 2560]
-
blk.12.ffn_gate.weightF16[2560 6912]
-
blk.12.ffn_up.weightF16[2560 6912]
-
blk.12.ffn_norm.weightF32[2560]
-
blk.12.attn_k.biasF32[2560]
-
blk.12.attn_k.weightF16[2560 2560]
-
blk.12.attn_output.weightF16[2560 2560]
-
blk.12.attn_q.biasF32[2560]
-
blk.12.attn_q.weightF16[2560 2560]
-
blk.12.attn_v.biasF32[2560]
-
blk.12.attn_v.weightF16[2560 2560]
-
blk.13.attn_norm.weightF32[2560]
-
blk.13.ffn_down.weightF16[6912 2560]
-
blk.13.ffn_gate.weightF16[2560 6912]
-
blk.13.ffn_up.weightF16[2560 6912]
-
blk.13.ffn_norm.weightF32[2560]
-
blk.13.attn_k.biasF32[2560]
-
blk.13.attn_k.weightF16[2560 2560]
-
blk.13.attn_output.weightF16[2560 2560]
-
blk.13.attn_q.biasF32[2560]
-
blk.13.attn_q.weightF16[2560 2560]
-
blk.13.attn_v.biasF32[2560]
-
blk.13.attn_v.weightF16[2560 2560]
-
blk.14.attn_norm.weightF32[2560]
-
blk.14.ffn_down.weightF16[6912 2560]
-
blk.14.ffn_gate.weightF16[2560 6912]
-
blk.14.ffn_up.weightF16[2560 6912]
-
blk.14.ffn_norm.weightF32[2560]
-
blk.14.attn_k.biasF32[2560]
-
blk.14.attn_k.weightF16[2560 2560]
-
blk.14.attn_output.weightF16[2560 2560]
-
blk.14.attn_q.biasF32[2560]
-
blk.14.attn_q.weightF16[2560 2560]
-
blk.14.attn_v.biasF32[2560]
-
blk.14.attn_v.weightF16[2560 2560]
-
blk.15.attn_norm.weightF32[2560]
-
blk.15.ffn_down.weightF16[6912 2560]
-
blk.15.ffn_gate.weightF16[2560 6912]
-
blk.15.ffn_up.weightF16[2560 6912]
-
blk.15.ffn_norm.weightF32[2560]
-
blk.15.attn_k.biasF32[2560]
-
blk.15.attn_k.weightF16[2560 2560]
-
blk.15.attn_output.weightF16[2560 2560]
-
blk.15.attn_q.biasF32[2560]
-
blk.15.attn_q.weightF16[2560 2560]
-
blk.15.attn_v.biasF32[2560]
-
blk.15.attn_v.weightF16[2560 2560]
-
blk.16.attn_norm.weightF32[2560]
-
blk.16.ffn_down.weightF16[6912 2560]
-
blk.16.ffn_gate.weightF16[2560 6912]
-
blk.16.ffn_up.weightF16[2560 6912]
-
blk.16.ffn_norm.weightF32[2560]
-
blk.16.attn_k.biasF32[2560]
-
blk.16.attn_k.weightF16[2560 2560]
-
blk.16.attn_output.weightF16[2560 2560]
-
blk.16.attn_q.biasF32[2560]
-
blk.16.attn_q.weightF16[2560 2560]
-
blk.16.attn_v.biasF32[2560]
-
blk.16.attn_v.weightF16[2560 2560]
-
blk.17.attn_norm.weightF32[2560]
-
blk.17.ffn_down.weightF16[6912 2560]
-
blk.17.ffn_gate.weightF16[2560 6912]
-
blk.17.ffn_up.weightF16[2560 6912]
-
blk.17.ffn_norm.weightF32[2560]
-
blk.17.attn_k.biasF32[2560]
-
blk.17.attn_k.weightF16[2560 2560]
-
blk.17.attn_output.weightF16[2560 2560]
-
blk.17.attn_q.biasF32[2560]
-
blk.17.attn_q.weightF16[2560 2560]
-
blk.17.attn_v.biasF32[2560]
-
blk.17.attn_v.weightF16[2560 2560]
-
blk.18.attn_norm.weightF32[2560]
-
blk.18.ffn_down.weightF16[6912 2560]
-
blk.18.ffn_gate.weightF16[2560 6912]
-
blk.18.ffn_up.weightF16[2560 6912]
-
blk.18.ffn_norm.weightF32[2560]
-
blk.18.attn_k.biasF32[2560]
-
blk.18.attn_k.weightF16[2560 2560]
-
blk.18.attn_output.weightF16[2560 2560]
-
blk.18.attn_q.biasF32[2560]
-
blk.18.attn_q.weightF16[2560 2560]
-
blk.18.attn_v.biasF32[2560]
-
blk.18.attn_v.weightF16[2560 2560]
-
blk.19.attn_norm.weightF32[2560]
-
blk.19.ffn_down.weightF16[6912 2560]
-
blk.19.ffn_gate.weightF16[2560 6912]
-
blk.19.ffn_up.weightF16[2560 6912]
-
blk.19.ffn_norm.weightF32[2560]
-
blk.19.attn_k.biasF32[2560]
-
blk.19.attn_k.weightF16[2560 2560]
-
blk.19.attn_output.weightF16[2560 2560]
-
blk.19.attn_q.biasF32[2560]
-
blk.19.attn_q.weightF16[2560 2560]
-
blk.19.attn_v.biasF32[2560]
-
blk.19.attn_v.weightF16[2560 2560]
-
blk.20.attn_norm.weightF32[2560]
-
blk.20.ffn_down.weightF16[6912 2560]
-
blk.20.ffn_gate.weightF16[2560 6912]
-
blk.20.ffn_up.weightF16[2560 6912]
-
blk.20.ffn_norm.weightF32[2560]
-
blk.20.attn_k.biasF32[2560]
-
blk.20.attn_k.weightF16[2560 2560]
-
blk.20.attn_output.weightF16[2560 2560]
-
blk.20.attn_q.biasF32[2560]
-
blk.20.attn_q.weightF16[2560 2560]
-
blk.20.attn_v.biasF32[2560]
-
blk.20.attn_v.weightF16[2560 2560]
-
blk.21.attn_norm.weightF32[2560]
-
blk.21.ffn_down.weightF16[6912 2560]
-
blk.21.ffn_gate.weightF16[2560 6912]
-
blk.21.ffn_up.weightF16[2560 6912]
-
blk.21.ffn_norm.weightF32[2560]
-
blk.21.attn_k.biasF32[2560]
-
blk.21.attn_k.weightF16[2560 2560]
-
blk.21.attn_output.weightF16[2560 2560]
-
blk.21.attn_q.biasF32[2560]
-
blk.21.attn_q.weightF16[2560 2560]
-
blk.21.attn_v.biasF32[2560]
-
blk.21.attn_v.weightF16[2560 2560]
-
blk.22.attn_norm.weightF32[2560]
-
blk.22.ffn_down.weightF16[6912 2560]
-
blk.22.ffn_gate.weightF16[2560 6912]
-
blk.22.ffn_up.weightF16[2560 6912]
-
blk.22.ffn_norm.weightF32[2560]
-
blk.22.attn_k.biasF32[2560]
-
blk.22.attn_k.weightF16[2560 2560]
-
blk.22.attn_output.weightF16[2560 2560]
-
blk.22.attn_q.biasF32[2560]
-
blk.22.attn_q.weightF16[2560 2560]
-
blk.22.attn_v.biasF32[2560]
-
blk.22.attn_v.weightF16[2560 2560]
-
blk.23.attn_norm.weightF32[2560]
-
blk.23.ffn_down.weightF16[6912 2560]
-
blk.23.ffn_gate.weightF16[2560 6912]
-
blk.23.ffn_up.weightF16[2560 6912]
-
blk.23.ffn_norm.weightF32[2560]
-
blk.23.attn_k.biasF32[2560]
-
blk.23.attn_k.weightF16[2560 2560]
-
blk.23.attn_output.weightF16[2560 2560]
-
blk.23.attn_q.biasF32[2560]
-
blk.23.attn_q.weightF16[2560 2560]
-
blk.23.attn_v.biasF32[2560]
-
blk.23.attn_v.weightF16[2560 2560]
-
blk.24.attn_norm.weightF32[2560]
-
blk.24.ffn_down.weightF16[6912 2560]
-
blk.24.ffn_gate.weightF16[2560 6912]
-
blk.24.ffn_up.weightF16[2560 6912]
-
blk.24.ffn_norm.weightF32[2560]
-
blk.24.attn_k.biasF32[2560]
-
blk.24.attn_k.weightF16[2560 2560]
-
blk.24.attn_output.weightF16[2560 2560]
-
blk.24.attn_q.biasF32[2560]
-
blk.24.attn_q.weightF16[2560 2560]
-
blk.24.attn_v.biasF32[2560]
-
blk.24.attn_v.weightF16[2560 2560]
-
blk.25.attn_norm.weightF32[2560]
-
blk.25.ffn_down.weightF16[6912 2560]
-
blk.25.ffn_gate.weightF16[2560 6912]
-
blk.25.ffn_up.weightF16[2560 6912]
-
blk.25.ffn_norm.weightF32[2560]
-
blk.25.attn_k.biasF32[2560]
-
blk.25.attn_k.weightF16[2560 2560]
-
blk.25.attn_output.weightF16[2560 2560]
-
blk.25.attn_q.biasF32[2560]
-
blk.25.attn_q.weightF16[2560 2560]
-
blk.25.attn_v.biasF32[2560]
-
blk.25.attn_v.weightF16[2560 2560]
-
blk.26.ffn_gate.weightF16[2560 6912]
-
blk.26.attn_k.biasF32[2560]
-
blk.26.attn_k.weightF16[2560 2560]
-
blk.26.attn_output.weightF16[2560 2560]
-
blk.26.attn_q.biasF32[2560]
-
blk.26.attn_q.weightF16[2560 2560]
-
blk.26.attn_v.biasF32[2560]
-
blk.26.attn_v.weightF16[2560 2560]
-
blk.26.attn_norm.weightF32[2560]
-
blk.26.ffn_down.weightF16[6912 2560]
-
blk.26.ffn_up.weightF16[2560 6912]
-
blk.26.ffn_norm.weightF32[2560]
-
blk.27.attn_norm.weightF32[2560]
-
blk.27.ffn_down.weightF16[6912 2560]
-
blk.27.ffn_gate.weightF16[2560 6912]
-
blk.27.ffn_up.weightF16[2560 6912]
-
blk.27.ffn_norm.weightF32[2560]
-
blk.27.attn_k.biasF32[2560]
-
blk.27.attn_k.weightF16[2560 2560]
-
blk.27.attn_output.weightF16[2560 2560]
-
blk.27.attn_q.biasF32[2560]
-
blk.27.attn_q.weightF16[2560 2560]
-
blk.27.attn_v.biasF32[2560]
-
blk.27.attn_v.weightF16[2560 2560]
-
blk.28.attn_norm.weightF32[2560]
-
blk.28.ffn_down.weightF16[6912 2560]
-
blk.28.ffn_gate.weightF16[2560 6912]
-
blk.28.ffn_up.weightF16[2560 6912]
-
blk.28.ffn_norm.weightF32[2560]
-
blk.28.attn_k.biasF32[2560]
-
blk.28.attn_k.weightF16[2560 2560]
-
blk.28.attn_output.weightF16[2560 2560]
-
blk.28.attn_q.biasF32[2560]
-
blk.28.attn_q.weightF16[2560 2560]
-
blk.28.attn_v.biasF32[2560]
-
blk.28.attn_v.weightF16[2560 2560]
-
blk.29.attn_norm.weightF32[2560]
-
blk.29.ffn_down.weightF16[6912 2560]
-
blk.29.ffn_gate.weightF16[2560 6912]
-
blk.29.ffn_up.weightF16[2560 6912]
-
blk.29.ffn_norm.weightF32[2560]
-
blk.29.attn_k.biasF32[2560]
-
blk.29.attn_k.weightF16[2560 2560]
-
blk.29.attn_output.weightF16[2560 2560]
-
blk.29.attn_q.biasF32[2560]
-
blk.29.attn_q.weightF16[2560 2560]
-
blk.29.attn_v.biasF32[2560]
-
blk.29.attn_v.weightF16[2560 2560]
-
blk.30.attn_norm.weightF32[2560]
-
blk.30.ffn_down.weightF16[6912 2560]
-
blk.30.ffn_gate.weightF16[2560 6912]
-
blk.30.ffn_up.weightF16[2560 6912]
-
blk.30.ffn_norm.weightF32[2560]
-
blk.30.attn_k.biasF32[2560]
-
blk.30.attn_k.weightF16[2560 2560]
-
blk.30.attn_output.weightF16[2560 2560]
-
blk.30.attn_q.biasF32[2560]
-
blk.30.attn_q.weightF16[2560 2560]
-
blk.30.attn_v.biasF32[2560]
-
blk.30.attn_v.weightF16[2560 2560]
-
blk.31.attn_norm.weightF32[2560]
-
blk.31.ffn_down.weightF16[6912 2560]
-
blk.31.ffn_gate.weightF16[2560 6912]
-
blk.31.ffn_up.weightF16[2560 6912]
-
blk.31.ffn_norm.weightF32[2560]
-
blk.31.attn_k.biasF32[2560]
-
blk.31.attn_k.weightF16[2560 2560]
-
blk.31.attn_output.weightF16[2560 2560]
-
blk.31.attn_q.biasF32[2560]
-
blk.31.attn_q.weightF16[2560 2560]
-
blk.31.attn_v.biasF32[2560]
-
blk.31.attn_v.weightF16[2560 2560]
-
blk.32.attn_norm.weightF32[2560]
-
blk.32.ffn_down.weightF16[6912 2560]
-
blk.32.ffn_gate.weightF16[2560 6912]
-
blk.32.ffn_up.weightF16[2560 6912]
-
blk.32.ffn_norm.weightF32[2560]
-
blk.32.attn_k.biasF32[2560]
-
blk.32.attn_k.weightF16[2560 2560]
-
blk.32.attn_output.weightF16[2560 2560]
-
blk.32.attn_q.biasF32[2560]
-
blk.32.attn_q.weightF16[2560 2560]
-
blk.32.attn_v.biasF32[2560]
-
blk.32.attn_v.weightF16[2560 2560]
-
blk.33.attn_norm.weightF32[2560]
-
blk.33.ffn_down.weightF16[6912 2560]
-
blk.33.ffn_gate.weightF16[2560 6912]
-
blk.33.ffn_up.weightF16[2560 6912]
-
blk.33.ffn_norm.weightF32[2560]
-
blk.33.attn_k.biasF32[2560]
-
blk.33.attn_k.weightF16[2560 2560]
-
blk.33.attn_output.weightF16[2560 2560]
-
blk.33.attn_q.biasF32[2560]
-
blk.33.attn_q.weightF16[2560 2560]
-
blk.33.attn_v.biasF32[2560]
-
blk.33.attn_v.weightF16[2560 2560]
-
blk.34.attn_norm.weightF32[2560]
-
blk.34.ffn_down.weightF16[6912 2560]
-
blk.34.ffn_gate.weightF16[2560 6912]
-
blk.34.ffn_up.weightF16[2560 6912]
-
blk.34.ffn_norm.weightF32[2560]
-
blk.34.attn_k.biasF32[2560]
-
blk.34.attn_k.weightF16[2560 2560]
-
blk.34.attn_output.weightF16[2560 2560]
-
blk.34.attn_q.biasF32[2560]
-
blk.34.attn_q.weightF16[2560 2560]
-
blk.34.attn_v.biasF32[2560]
-
blk.34.attn_v.weightF16[2560 2560]
-
blk.35.attn_norm.weightF32[2560]
-
blk.35.ffn_down.weightF16[6912 2560]
-
blk.35.ffn_gate.weightF16[2560 6912]
-
blk.35.ffn_up.weightF16[2560 6912]
-
blk.35.ffn_norm.weightF32[2560]
-
blk.35.attn_k.biasF32[2560]
-
blk.35.attn_k.weightF16[2560 2560]
-
blk.35.attn_output.weightF16[2560 2560]
-
blk.35.attn_q.biasF32[2560]
-
blk.35.attn_q.weightF16[2560 2560]
-
blk.35.attn_v.biasF32[2560]
-
blk.35.attn_v.weightF16[2560 2560]
-
blk.36.attn_norm.weightF32[2560]
-
blk.36.ffn_down.weightF16[6912 2560]
-
blk.36.ffn_gate.weightF16[2560 6912]
-
blk.36.ffn_up.weightF16[2560 6912]
-
blk.36.ffn_norm.weightF32[2560]
-
blk.36.attn_k.biasF32[2560]
-
blk.36.attn_k.weightF16[2560 2560]
-
blk.36.attn_output.weightF16[2560 2560]
-
blk.36.attn_q.biasF32[2560]
-
blk.36.attn_q.weightF16[2560 2560]
-
blk.36.attn_v.biasF32[2560]
-
blk.36.attn_v.weightF16[2560 2560]
-
blk.37.attn_norm.weightF32[2560]
-
blk.37.ffn_down.weightF16[6912 2560]
-
blk.37.ffn_gate.weightF16[2560 6912]
-
blk.37.ffn_up.weightF16[2560 6912]
-
blk.37.ffn_norm.weightF32[2560]
-
blk.37.attn_k.biasF32[2560]
-
blk.37.attn_k.weightF16[2560 2560]
-
blk.37.attn_output.weightF16[2560 2560]
-
blk.37.attn_q.biasF32[2560]
-
blk.37.attn_q.weightF16[2560 2560]
-
blk.37.attn_v.biasF32[2560]
-
blk.37.attn_v.weightF16[2560 2560]
-
blk.38.attn_norm.weightF32[2560]
-
blk.38.ffn_down.weightF16[6912 2560]
-
blk.38.ffn_gate.weightF16[2560 6912]
-
blk.38.ffn_up.weightF16[2560 6912]
-
blk.38.ffn_norm.weightF32[2560]
-
blk.38.attn_k.biasF32[2560]
-
blk.38.attn_k.weightF16[2560 2560]
-
blk.38.attn_output.weightF16[2560 2560]
-
blk.38.attn_q.biasF32[2560]
-
blk.38.attn_q.weightF16[2560 2560]
-
blk.38.attn_v.biasF32[2560]
-
blk.38.attn_v.weightF16[2560 2560]
-
blk.39.attn_norm.weightF32[2560]
-
blk.39.ffn_down.weightF16[6912 2560]
-
blk.39.ffn_gate.weightF16[2560 6912]
-
blk.39.ffn_up.weightF16[2560 6912]
-
blk.39.ffn_norm.weightF32[2560]
-
blk.39.attn_k.biasF32[2560]
-
blk.39.attn_k.weightF16[2560 2560]
-
blk.39.attn_output.weightF16[2560 2560]
-
blk.39.attn_q.biasF32[2560]
-
blk.39.attn_q.weightF16[2560 2560]
-
blk.39.attn_v.biasF32[2560]
-
blk.39.attn_v.weightF16[2560 2560]
-
output.weightF16[2560 151936]
-
output_norm.weightF32[2560]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39