latest
2.5GB
minicpm3_4b-ggml-model-Q4_K_M.gguf
268 Pulls Updated 2 weeks ago
430bdaab37af · 2.5GB
-
general.architectureminicpm3
-
general.file_typeQ4_K_M
-
minicpm3.attention.head_count40
-
minicpm3.attention.head_count_kv40
-
minicpm3.attention.key_length96
-
minicpm3.attention.kv_lora_rank256
-
minicpm3.attention.layer_norm_rms_epsilon1e-05
-
minicpm3.attention.q_lora_rank768
-
minicpm3.block_count62
-
minicpm3.context_length32768
-
minicpm3.embedding_length2560
-
minicpm3.feed_forward_length6400
-
minicpm3.rope.dimension_count32
-
minicpm3.vocab_size73448
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id73440
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 1 1 1 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <SEP> <CLS> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ6_K[2560 73448]
-
blk.0.attn_norm.weightF32[2560]
-
blk.0.attn_q_b.weightQ4_K[768 3840]
-
blk.0.attn_q_a.weightQ4_K[2560 768]
-
blk.0.attn_kv_b.weightQ4_K[256 5120]
-
blk.0.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.0.attn_q_a_norm.weightF32[768]
-
blk.0.attn_kv_a_norm.weightF32[256]
-
blk.0.attn_output.weightQ4_K[2560 2560]
-
blk.0.ffn_norm.weightF32[2560]
-
blk.0.ffn_gate.weightQ4_K[2560 6400]
-
blk.0.ffn_up.weightQ4_K[2560 6400]
-
blk.0.ffn_down.weightQ6_K[6400 2560]
-
blk.1.attn_norm.weightF32[2560]
-
blk.1.attn_q_b.weightQ4_K[768 3840]
-
blk.1.attn_q_a.weightQ4_K[2560 768]
-
blk.1.attn_kv_b.weightQ4_K[256 5120]
-
blk.1.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.1.attn_q_a_norm.weightF32[768]
-
blk.1.attn_kv_a_norm.weightF32[256]
-
blk.1.attn_output.weightQ4_K[2560 2560]
-
blk.1.ffn_norm.weightF32[2560]
-
blk.1.ffn_gate.weightQ4_K[2560 6400]
-
blk.1.ffn_up.weightQ4_K[2560 6400]
-
blk.1.ffn_down.weightQ6_K[6400 2560]
-
blk.2.attn_norm.weightF32[2560]
-
blk.2.attn_q_b.weightQ4_K[768 3840]
-
blk.2.attn_q_a.weightQ4_K[2560 768]
-
blk.2.attn_kv_b.weightQ4_K[256 5120]
-
blk.2.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.2.attn_q_a_norm.weightF32[768]
-
blk.2.attn_kv_a_norm.weightF32[256]
-
blk.2.attn_output.weightQ4_K[2560 2560]
-
blk.2.ffn_norm.weightF32[2560]
-
blk.2.ffn_gate.weightQ4_K[2560 6400]
-
blk.2.ffn_up.weightQ4_K[2560 6400]
-
blk.2.ffn_down.weightQ6_K[6400 2560]
-
blk.3.attn_norm.weightF32[2560]
-
blk.3.attn_q_b.weightQ4_K[768 3840]
-
blk.3.attn_q_a.weightQ4_K[2560 768]
-
blk.3.attn_kv_b.weightQ4_K[256 5120]
-
blk.3.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.3.attn_q_a_norm.weightF32[768]
-
blk.3.attn_kv_a_norm.weightF32[256]
-
blk.3.attn_output.weightQ4_K[2560 2560]
-
blk.3.ffn_norm.weightF32[2560]
-
blk.3.ffn_gate.weightQ4_K[2560 6400]
-
blk.3.ffn_up.weightQ4_K[2560 6400]
-
blk.3.ffn_down.weightQ6_K[6400 2560]
-
blk.4.attn_norm.weightF32[2560]
-
blk.4.attn_q_b.weightQ4_K[768 3840]
-
blk.4.attn_q_a.weightQ4_K[2560 768]
-
blk.4.attn_kv_b.weightQ4_K[256 5120]
-
blk.4.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.4.attn_q_a_norm.weightF32[768]
-
blk.4.attn_kv_a_norm.weightF32[256]
-
blk.4.attn_output.weightQ4_K[2560 2560]
-
blk.4.ffn_norm.weightF32[2560]
-
blk.4.ffn_gate.weightQ4_K[2560 6400]
-
blk.4.ffn_up.weightQ4_K[2560 6400]
-
blk.4.ffn_down.weightQ6_K[6400 2560]
-
blk.5.attn_norm.weightF32[2560]
-
blk.5.attn_q_b.weightQ4_K[768 3840]
-
blk.5.attn_q_a.weightQ4_K[2560 768]
-
blk.5.attn_kv_b.weightQ4_K[256 5120]
-
blk.5.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.5.attn_q_a_norm.weightF32[768]
-
blk.5.attn_kv_a_norm.weightF32[256]
-
blk.5.attn_output.weightQ4_K[2560 2560]
-
blk.5.ffn_norm.weightF32[2560]
-
blk.5.ffn_gate.weightQ4_K[2560 6400]
-
blk.5.ffn_up.weightQ4_K[2560 6400]
-
blk.5.ffn_down.weightQ6_K[6400 2560]
-
blk.6.attn_norm.weightF32[2560]
-
blk.6.attn_q_b.weightQ4_K[768 3840]
-
blk.6.attn_q_a.weightQ4_K[2560 768]
-
blk.6.attn_kv_b.weightQ4_K[256 5120]
-
blk.6.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.6.attn_q_a_norm.weightF32[768]
-
blk.6.attn_kv_a_norm.weightF32[256]
-
blk.6.attn_output.weightQ4_K[2560 2560]
-
blk.6.ffn_norm.weightF32[2560]
-
blk.6.ffn_gate.weightQ4_K[2560 6400]
-
blk.6.ffn_up.weightQ4_K[2560 6400]
-
blk.6.ffn_down.weightQ6_K[6400 2560]
-
blk.7.attn_norm.weightF32[2560]
-
blk.7.attn_q_b.weightQ4_K[768 3840]
-
blk.7.attn_q_a.weightQ4_K[2560 768]
-
blk.7.attn_kv_b.weightQ4_K[256 5120]
-
blk.7.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.7.attn_q_a_norm.weightF32[768]
-
blk.7.attn_kv_a_norm.weightF32[256]
-
blk.7.attn_output.weightQ4_K[2560 2560]
-
blk.7.ffn_norm.weightF32[2560]
-
blk.7.ffn_gate.weightQ4_K[2560 6400]
-
blk.7.ffn_up.weightQ4_K[2560 6400]
-
blk.7.ffn_down.weightQ4_K[6400 2560]
-
blk.8.attn_norm.weightF32[2560]
-
blk.8.attn_q_b.weightQ4_K[768 3840]
-
blk.8.attn_q_a.weightQ4_K[2560 768]
-
blk.8.attn_kv_b.weightQ4_K[256 5120]
-
blk.8.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.8.attn_q_a_norm.weightF32[768]
-
blk.8.attn_kv_a_norm.weightF32[256]
-
blk.8.attn_output.weightQ4_K[2560 2560]
-
blk.8.ffn_norm.weightF32[2560]
-
blk.8.ffn_gate.weightQ4_K[2560 6400]
-
blk.8.ffn_up.weightQ4_K[2560 6400]
-
blk.8.ffn_down.weightQ4_K[6400 2560]
-
blk.9.attn_norm.weightF32[2560]
-
blk.9.attn_q_b.weightQ4_K[768 3840]
-
blk.9.attn_q_a.weightQ4_K[2560 768]
-
blk.9.attn_kv_b.weightQ4_K[256 5120]
-
blk.9.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.9.attn_q_a_norm.weightF32[768]
-
blk.9.attn_kv_a_norm.weightF32[256]
-
blk.9.attn_output.weightQ4_K[2560 2560]
-
blk.9.ffn_norm.weightF32[2560]
-
blk.9.ffn_gate.weightQ4_K[2560 6400]
-
blk.9.ffn_up.weightQ4_K[2560 6400]
-
blk.9.ffn_down.weightQ6_K[6400 2560]
-
blk.10.attn_norm.weightF32[2560]
-
blk.10.attn_q_b.weightQ4_K[768 3840]
-
blk.10.attn_q_a.weightQ4_K[2560 768]
-
blk.10.attn_kv_b.weightQ4_K[256 5120]
-
blk.10.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.10.attn_q_a_norm.weightF32[768]
-
blk.10.attn_kv_a_norm.weightF32[256]
-
blk.10.attn_output.weightQ4_K[2560 2560]
-
blk.10.ffn_norm.weightF32[2560]
-
blk.10.ffn_gate.weightQ4_K[2560 6400]
-
blk.10.ffn_up.weightQ4_K[2560 6400]
-
blk.10.ffn_down.weightQ4_K[6400 2560]
-
blk.11.attn_norm.weightF32[2560]
-
blk.11.attn_q_b.weightQ4_K[768 3840]
-
blk.11.attn_q_a.weightQ4_K[2560 768]
-
blk.11.attn_kv_b.weightQ4_K[256 5120]
-
blk.11.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.11.attn_q_a_norm.weightF32[768]
-
blk.11.attn_kv_a_norm.weightF32[256]
-
blk.11.attn_output.weightQ4_K[2560 2560]
-
blk.11.ffn_norm.weightF32[2560]
-
blk.11.ffn_gate.weightQ4_K[2560 6400]
-
blk.11.ffn_up.weightQ4_K[2560 6400]
-
blk.11.ffn_down.weightQ4_K[6400 2560]
-
blk.12.attn_norm.weightF32[2560]
-
blk.12.attn_q_b.weightQ4_K[768 3840]
-
blk.12.attn_q_a.weightQ4_K[2560 768]
-
blk.12.attn_kv_b.weightQ4_K[256 5120]
-
blk.12.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.12.attn_q_a_norm.weightF32[768]
-
blk.12.attn_kv_a_norm.weightF32[256]
-
blk.12.attn_output.weightQ4_K[2560 2560]
-
blk.12.ffn_norm.weightF32[2560]
-
blk.12.ffn_gate.weightQ4_K[2560 6400]
-
blk.12.ffn_up.weightQ4_K[2560 6400]
-
blk.12.ffn_down.weightQ6_K[6400 2560]
-
blk.13.attn_norm.weightF32[2560]
-
blk.13.attn_q_b.weightQ4_K[768 3840]
-
blk.13.attn_q_a.weightQ4_K[2560 768]
-
blk.13.attn_kv_b.weightQ4_K[256 5120]
-
blk.13.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.13.attn_q_a_norm.weightF32[768]
-
blk.13.attn_kv_a_norm.weightF32[256]
-
blk.13.attn_output.weightQ4_K[2560 2560]
-
blk.13.ffn_norm.weightF32[2560]
-
blk.13.ffn_gate.weightQ4_K[2560 6400]
-
blk.13.ffn_up.weightQ4_K[2560 6400]
-
blk.13.ffn_down.weightQ4_K[6400 2560]
-
blk.14.attn_norm.weightF32[2560]
-
blk.14.attn_q_b.weightQ4_K[768 3840]
-
blk.14.attn_q_a.weightQ4_K[2560 768]
-
blk.14.attn_kv_b.weightQ4_K[256 5120]
-
blk.14.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.14.attn_q_a_norm.weightF32[768]
-
blk.14.attn_kv_a_norm.weightF32[256]
-
blk.14.attn_output.weightQ4_K[2560 2560]
-
blk.14.ffn_norm.weightF32[2560]
-
blk.14.ffn_gate.weightQ4_K[2560 6400]
-
blk.14.ffn_up.weightQ4_K[2560 6400]
-
blk.14.ffn_down.weightQ4_K[6400 2560]
-
blk.15.attn_norm.weightF32[2560]
-
blk.15.attn_q_b.weightQ4_K[768 3840]
-
blk.15.attn_q_a.weightQ4_K[2560 768]
-
blk.15.attn_kv_b.weightQ4_K[256 5120]
-
blk.15.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.15.attn_q_a_norm.weightF32[768]
-
blk.15.attn_kv_a_norm.weightF32[256]
-
blk.15.attn_output.weightQ4_K[2560 2560]
-
blk.15.ffn_norm.weightF32[2560]
-
blk.15.ffn_gate.weightQ4_K[2560 6400]
-
blk.15.ffn_up.weightQ4_K[2560 6400]
-
blk.15.ffn_down.weightQ6_K[6400 2560]
-
blk.16.attn_norm.weightF32[2560]
-
blk.16.attn_q_b.weightQ4_K[768 3840]
-
blk.16.attn_q_a.weightQ4_K[2560 768]
-
blk.16.attn_kv_b.weightQ4_K[256 5120]
-
blk.16.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.16.attn_q_a_norm.weightF32[768]
-
blk.16.attn_kv_a_norm.weightF32[256]
-
blk.16.attn_output.weightQ4_K[2560 2560]
-
blk.16.ffn_norm.weightF32[2560]
-
blk.16.ffn_gate.weightQ4_K[2560 6400]
-
blk.16.ffn_up.weightQ4_K[2560 6400]
-
blk.16.ffn_down.weightQ4_K[6400 2560]
-
blk.17.attn_norm.weightF32[2560]
-
blk.17.attn_q_b.weightQ4_K[768 3840]
-
blk.17.attn_q_a.weightQ4_K[2560 768]
-
blk.17.attn_kv_b.weightQ4_K[256 5120]
-
blk.17.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.17.attn_q_a_norm.weightF32[768]
-
blk.17.attn_kv_a_norm.weightF32[256]
-
blk.17.attn_output.weightQ4_K[2560 2560]
-
blk.17.ffn_norm.weightF32[2560]
-
blk.17.ffn_gate.weightQ4_K[2560 6400]
-
blk.17.ffn_up.weightQ4_K[2560 6400]
-
blk.17.ffn_down.weightQ4_K[6400 2560]
-
blk.18.attn_norm.weightF32[2560]
-
blk.18.attn_q_b.weightQ4_K[768 3840]
-
blk.18.attn_q_a.weightQ4_K[2560 768]
-
blk.18.attn_kv_b.weightQ4_K[256 5120]
-
blk.18.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.18.attn_q_a_norm.weightF32[768]
-
blk.18.attn_kv_a_norm.weightF32[256]
-
blk.18.attn_output.weightQ4_K[2560 2560]
-
blk.18.ffn_norm.weightF32[2560]
-
blk.18.ffn_gate.weightQ4_K[2560 6400]
-
blk.18.ffn_up.weightQ4_K[2560 6400]
-
blk.18.ffn_down.weightQ6_K[6400 2560]
-
blk.19.attn_norm.weightF32[2560]
-
blk.19.attn_q_b.weightQ4_K[768 3840]
-
blk.19.attn_q_a.weightQ4_K[2560 768]
-
blk.19.attn_kv_b.weightQ4_K[256 5120]
-
blk.19.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.19.attn_q_a_norm.weightF32[768]
-
blk.19.attn_kv_a_norm.weightF32[256]
-
blk.19.attn_output.weightQ4_K[2560 2560]
-
blk.19.ffn_norm.weightF32[2560]
-
blk.19.ffn_gate.weightQ4_K[2560 6400]
-
blk.19.ffn_up.weightQ4_K[2560 6400]
-
blk.19.ffn_down.weightQ4_K[6400 2560]
-
blk.20.attn_norm.weightF32[2560]
-
blk.20.attn_q_b.weightQ4_K[768 3840]
-
blk.20.attn_q_a.weightQ4_K[2560 768]
-
blk.20.attn_kv_b.weightQ4_K[256 5120]
-
blk.20.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.20.attn_q_a_norm.weightF32[768]
-
blk.20.attn_kv_a_norm.weightF32[256]
-
blk.20.attn_output.weightQ4_K[2560 2560]
-
blk.20.ffn_norm.weightF32[2560]
-
blk.20.ffn_gate.weightQ4_K[2560 6400]
-
blk.20.ffn_up.weightQ4_K[2560 6400]
-
blk.20.ffn_down.weightQ4_K[6400 2560]
-
blk.21.attn_norm.weightF32[2560]
-
blk.21.attn_q_b.weightQ4_K[768 3840]
-
blk.21.attn_q_a.weightQ4_K[2560 768]
-
blk.21.attn_kv_b.weightQ4_K[256 5120]
-
blk.21.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.21.attn_q_a_norm.weightF32[768]
-
blk.21.attn_kv_a_norm.weightF32[256]
-
blk.21.attn_output.weightQ4_K[2560 2560]
-
blk.21.ffn_norm.weightF32[2560]
-
blk.21.ffn_gate.weightQ4_K[2560 6400]
-
blk.21.ffn_up.weightQ4_K[2560 6400]
-
blk.21.ffn_down.weightQ6_K[6400 2560]
-
blk.22.attn_norm.weightF32[2560]
-
blk.22.attn_q_b.weightQ4_K[768 3840]
-
blk.22.attn_q_a.weightQ4_K[2560 768]
-
blk.22.attn_kv_b.weightQ4_K[256 5120]
-
blk.22.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.22.attn_q_a_norm.weightF32[768]
-
blk.22.attn_kv_a_norm.weightF32[256]
-
blk.22.attn_output.weightQ4_K[2560 2560]
-
blk.22.ffn_norm.weightF32[2560]
-
blk.22.ffn_gate.weightQ4_K[2560 6400]
-
blk.22.ffn_up.weightQ4_K[2560 6400]
-
blk.22.ffn_down.weightQ4_K[6400 2560]
-
blk.23.attn_norm.weightF32[2560]
-
blk.23.attn_q_b.weightQ4_K[768 3840]
-
blk.23.attn_q_a.weightQ4_K[2560 768]
-
blk.23.attn_kv_b.weightQ4_K[256 5120]
-
blk.23.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.23.attn_q_a_norm.weightF32[768]
-
blk.23.attn_kv_a_norm.weightF32[256]
-
blk.23.attn_output.weightQ4_K[2560 2560]
-
blk.23.ffn_norm.weightF32[2560]
-
blk.23.ffn_gate.weightQ4_K[2560 6400]
-
blk.23.ffn_up.weightQ4_K[2560 6400]
-
blk.23.ffn_down.weightQ4_K[6400 2560]
-
blk.24.attn_norm.weightF32[2560]
-
blk.24.attn_q_b.weightQ4_K[768 3840]
-
blk.24.attn_q_a.weightQ4_K[2560 768]
-
blk.24.attn_kv_b.weightQ4_K[256 5120]
-
blk.24.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.24.attn_q_a_norm.weightF32[768]
-
blk.24.attn_kv_a_norm.weightF32[256]
-
blk.24.attn_output.weightQ4_K[2560 2560]
-
blk.24.ffn_norm.weightF32[2560]
-
blk.24.ffn_gate.weightQ4_K[2560 6400]
-
blk.24.ffn_up.weightQ4_K[2560 6400]
-
blk.24.ffn_down.weightQ6_K[6400 2560]
-
blk.25.attn_norm.weightF32[2560]
-
blk.25.attn_q_b.weightQ4_K[768 3840]
-
blk.25.attn_q_a.weightQ4_K[2560 768]
-
blk.25.attn_kv_b.weightQ4_K[256 5120]
-
blk.25.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.25.attn_q_a_norm.weightF32[768]
-
blk.25.attn_kv_a_norm.weightF32[256]
-
blk.25.attn_output.weightQ4_K[2560 2560]
-
blk.25.ffn_norm.weightF32[2560]
-
blk.25.ffn_gate.weightQ4_K[2560 6400]
-
blk.25.ffn_up.weightQ4_K[2560 6400]
-
blk.25.ffn_down.weightQ4_K[6400 2560]
-
blk.26.attn_norm.weightF32[2560]
-
blk.26.attn_q_b.weightQ4_K[768 3840]
-
blk.26.attn_q_a.weightQ4_K[2560 768]
-
blk.26.attn_kv_b.weightQ4_K[256 5120]
-
blk.26.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.26.attn_q_a_norm.weightF32[768]
-
blk.26.attn_kv_a_norm.weightF32[256]
-
blk.26.attn_output.weightQ4_K[2560 2560]
-
blk.26.ffn_norm.weightF32[2560]
-
blk.26.ffn_gate.weightQ4_K[2560 6400]
-
blk.26.ffn_up.weightQ4_K[2560 6400]
-
blk.26.ffn_down.weightQ4_K[6400 2560]
-
blk.27.attn_norm.weightF32[2560]
-
blk.27.attn_q_b.weightQ4_K[768 3840]
-
blk.27.attn_q_a.weightQ4_K[2560 768]
-
blk.27.attn_kv_b.weightQ4_K[256 5120]
-
blk.27.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.27.attn_q_a_norm.weightF32[768]
-
blk.27.attn_kv_a_norm.weightF32[256]
-
blk.27.attn_output.weightQ4_K[2560 2560]
-
blk.27.ffn_norm.weightF32[2560]
-
blk.27.ffn_gate.weightQ4_K[2560 6400]
-
blk.27.ffn_up.weightQ4_K[2560 6400]
-
blk.27.ffn_down.weightQ6_K[6400 2560]
-
blk.28.attn_norm.weightF32[2560]
-
blk.28.attn_q_b.weightQ4_K[768 3840]
-
blk.28.attn_q_a.weightQ4_K[2560 768]
-
blk.28.attn_kv_b.weightQ4_K[256 5120]
-
blk.28.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.28.attn_q_a_norm.weightF32[768]
-
blk.28.attn_kv_a_norm.weightF32[256]
-
blk.28.attn_output.weightQ4_K[2560 2560]
-
blk.28.ffn_norm.weightF32[2560]
-
blk.28.ffn_gate.weightQ4_K[2560 6400]
-
blk.28.ffn_up.weightQ4_K[2560 6400]
-
blk.28.ffn_down.weightQ4_K[6400 2560]
-
blk.29.attn_norm.weightF32[2560]
-
blk.29.attn_q_b.weightQ4_K[768 3840]
-
blk.29.attn_q_a.weightQ4_K[2560 768]
-
blk.29.attn_kv_b.weightQ4_K[256 5120]
-
blk.29.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.29.attn_q_a_norm.weightF32[768]
-
blk.29.attn_kv_a_norm.weightF32[256]
-
blk.29.attn_output.weightQ4_K[2560 2560]
-
blk.29.ffn_norm.weightF32[2560]
-
blk.29.ffn_gate.weightQ4_K[2560 6400]
-
blk.29.ffn_up.weightQ4_K[2560 6400]
-
blk.29.ffn_down.weightQ4_K[6400 2560]
-
blk.30.attn_norm.weightF32[2560]
-
blk.30.attn_q_b.weightQ4_K[768 3840]
-
blk.30.attn_q_a.weightQ4_K[2560 768]
-
blk.30.attn_kv_b.weightQ4_K[256 5120]
-
blk.30.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.30.attn_q_a_norm.weightF32[768]
-
blk.30.attn_kv_a_norm.weightF32[256]
-
blk.30.attn_output.weightQ4_K[2560 2560]
-
blk.30.ffn_norm.weightF32[2560]
-
blk.30.ffn_gate.weightQ4_K[2560 6400]
-
blk.30.ffn_up.weightQ4_K[2560 6400]
-
blk.30.ffn_down.weightQ6_K[6400 2560]
-
blk.31.attn_norm.weightF32[2560]
-
blk.31.attn_q_b.weightQ4_K[768 3840]
-
blk.31.attn_q_a.weightQ4_K[2560 768]
-
blk.31.attn_kv_b.weightQ4_K[256 5120]
-
blk.31.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.31.attn_q_a_norm.weightF32[768]
-
blk.31.attn_kv_a_norm.weightF32[256]
-
blk.31.attn_output.weightQ4_K[2560 2560]
-
blk.31.ffn_norm.weightF32[2560]
-
blk.31.ffn_gate.weightQ4_K[2560 6400]
-
blk.31.ffn_up.weightQ4_K[2560 6400]
-
blk.31.ffn_down.weightQ4_K[6400 2560]
-
blk.32.attn_norm.weightF32[2560]
-
blk.32.attn_q_b.weightQ4_K[768 3840]
-
blk.32.attn_q_a.weightQ4_K[2560 768]
-
blk.32.attn_kv_b.weightQ4_K[256 5120]
-
blk.32.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.32.attn_q_a_norm.weightF32[768]
-
blk.32.attn_kv_a_norm.weightF32[256]
-
blk.32.attn_output.weightQ4_K[2560 2560]
-
blk.32.ffn_norm.weightF32[2560]
-
blk.32.ffn_gate.weightQ4_K[2560 6400]
-
blk.32.ffn_up.weightQ4_K[2560 6400]
-
blk.32.ffn_down.weightQ4_K[6400 2560]
-
blk.33.attn_norm.weightF32[2560]
-
blk.33.attn_q_b.weightQ4_K[768 3840]
-
blk.33.attn_q_a.weightQ4_K[2560 768]
-
blk.33.attn_kv_b.weightQ4_K[256 5120]
-
blk.33.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.33.attn_q_a_norm.weightF32[768]
-
blk.33.attn_kv_a_norm.weightF32[256]
-
blk.33.attn_output.weightQ4_K[2560 2560]
-
blk.33.ffn_norm.weightF32[2560]
-
blk.33.ffn_gate.weightQ4_K[2560 6400]
-
blk.33.ffn_up.weightQ4_K[2560 6400]
-
blk.33.ffn_down.weightQ6_K[6400 2560]
-
blk.34.attn_norm.weightF32[2560]
-
blk.34.attn_q_b.weightQ4_K[768 3840]
-
blk.34.attn_q_a.weightQ4_K[2560 768]
-
blk.34.attn_kv_b.weightQ4_K[256 5120]
-
blk.34.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.34.attn_q_a_norm.weightF32[768]
-
blk.34.attn_kv_a_norm.weightF32[256]
-
blk.34.attn_output.weightQ4_K[2560 2560]
-
blk.34.ffn_norm.weightF32[2560]
-
blk.34.ffn_gate.weightQ4_K[2560 6400]
-
blk.34.ffn_up.weightQ4_K[2560 6400]
-
blk.34.ffn_down.weightQ4_K[6400 2560]
-
blk.35.attn_norm.weightF32[2560]
-
blk.35.attn_q_b.weightQ4_K[768 3840]
-
blk.35.attn_q_a.weightQ4_K[2560 768]
-
blk.35.attn_kv_b.weightQ4_K[256 5120]
-
blk.35.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.35.attn_q_a_norm.weightF32[768]
-
blk.35.attn_kv_a_norm.weightF32[256]
-
blk.35.attn_output.weightQ4_K[2560 2560]
-
blk.35.ffn_norm.weightF32[2560]
-
blk.35.ffn_gate.weightQ4_K[2560 6400]
-
blk.35.ffn_up.weightQ4_K[2560 6400]
-
blk.35.ffn_down.weightQ4_K[6400 2560]
-
blk.36.attn_norm.weightF32[2560]
-
blk.36.attn_q_b.weightQ4_K[768 3840]
-
blk.36.attn_q_a.weightQ4_K[2560 768]
-
blk.36.attn_kv_b.weightQ4_K[256 5120]
-
blk.36.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.36.attn_q_a_norm.weightF32[768]
-
blk.36.attn_kv_a_norm.weightF32[256]
-
blk.36.attn_output.weightQ4_K[2560 2560]
-
blk.36.ffn_norm.weightF32[2560]
-
blk.36.ffn_gate.weightQ4_K[2560 6400]
-
blk.36.ffn_up.weightQ4_K[2560 6400]
-
blk.36.ffn_down.weightQ6_K[6400 2560]
-
blk.37.attn_norm.weightF32[2560]
-
blk.37.attn_q_b.weightQ4_K[768 3840]
-
blk.37.attn_q_a.weightQ4_K[2560 768]
-
blk.37.attn_kv_b.weightQ4_K[256 5120]
-
blk.37.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.37.attn_q_a_norm.weightF32[768]
-
blk.37.attn_kv_a_norm.weightF32[256]
-
blk.37.attn_output.weightQ4_K[2560 2560]
-
blk.37.ffn_norm.weightF32[2560]
-
blk.37.ffn_gate.weightQ4_K[2560 6400]
-
blk.37.ffn_up.weightQ4_K[2560 6400]
-
blk.37.ffn_down.weightQ4_K[6400 2560]
-
blk.38.attn_norm.weightF32[2560]
-
blk.38.attn_q_b.weightQ4_K[768 3840]
-
blk.38.attn_q_a.weightQ4_K[2560 768]
-
blk.38.attn_kv_b.weightQ4_K[256 5120]
-
blk.38.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.38.attn_q_a_norm.weightF32[768]
-
blk.38.attn_kv_a_norm.weightF32[256]
-
blk.38.attn_output.weightQ4_K[2560 2560]
-
blk.38.ffn_norm.weightF32[2560]
-
blk.38.ffn_gate.weightQ4_K[2560 6400]
-
blk.38.ffn_up.weightQ4_K[2560 6400]
-
blk.38.ffn_down.weightQ4_K[6400 2560]
-
blk.39.attn_norm.weightF32[2560]
-
blk.39.attn_q_b.weightQ4_K[768 3840]
-
blk.39.attn_q_a.weightQ4_K[2560 768]
-
blk.39.attn_kv_b.weightQ4_K[256 5120]
-
blk.39.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.39.attn_q_a_norm.weightF32[768]
-
blk.39.attn_kv_a_norm.weightF32[256]
-
blk.39.attn_output.weightQ4_K[2560 2560]
-
blk.39.ffn_norm.weightF32[2560]
-
blk.39.ffn_gate.weightQ4_K[2560 6400]
-
blk.39.ffn_up.weightQ4_K[2560 6400]
-
blk.39.ffn_down.weightQ6_K[6400 2560]
-
blk.40.attn_norm.weightF32[2560]
-
blk.40.attn_q_b.weightQ4_K[768 3840]
-
blk.40.attn_q_a.weightQ4_K[2560 768]
-
blk.40.attn_kv_b.weightQ4_K[256 5120]
-
blk.40.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.40.attn_q_a_norm.weightF32[768]
-
blk.40.attn_kv_a_norm.weightF32[256]
-
blk.40.attn_output.weightQ4_K[2560 2560]
-
blk.40.ffn_norm.weightF32[2560]
-
blk.40.ffn_gate.weightQ4_K[2560 6400]
-
blk.40.ffn_up.weightQ4_K[2560 6400]
-
blk.40.ffn_down.weightQ4_K[6400 2560]
-
blk.41.attn_norm.weightF32[2560]
-
blk.41.attn_q_b.weightQ4_K[768 3840]
-
blk.41.attn_q_a.weightQ4_K[2560 768]
-
blk.41.attn_kv_b.weightQ4_K[256 5120]
-
blk.41.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.41.attn_q_a_norm.weightF32[768]
-
blk.41.attn_kv_a_norm.weightF32[256]
-
blk.41.attn_output.weightQ4_K[2560 2560]
-
blk.41.ffn_norm.weightF32[2560]
-
blk.41.ffn_gate.weightQ4_K[2560 6400]
-
blk.41.ffn_up.weightQ4_K[2560 6400]
-
blk.41.ffn_down.weightQ4_K[6400 2560]
-
blk.42.attn_norm.weightF32[2560]
-
blk.42.attn_q_b.weightQ4_K[768 3840]
-
blk.42.attn_q_a.weightQ4_K[2560 768]
-
blk.42.attn_kv_b.weightQ4_K[256 5120]
-
blk.42.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.42.attn_q_a_norm.weightF32[768]
-
blk.42.attn_kv_a_norm.weightF32[256]
-
blk.42.attn_output.weightQ4_K[2560 2560]
-
blk.42.ffn_norm.weightF32[2560]
-
blk.42.ffn_gate.weightQ4_K[2560 6400]
-
blk.42.ffn_up.weightQ4_K[2560 6400]
-
blk.42.ffn_down.weightQ6_K[6400 2560]
-
blk.43.attn_norm.weightF32[2560]
-
blk.43.attn_q_b.weightQ4_K[768 3840]
-
blk.43.attn_q_a.weightQ4_K[2560 768]
-
blk.43.attn_kv_b.weightQ4_K[256 5120]
-
blk.43.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.43.attn_q_a_norm.weightF32[768]
-
blk.43.attn_kv_a_norm.weightF32[256]
-
blk.43.attn_output.weightQ4_K[2560 2560]
-
blk.43.ffn_norm.weightF32[2560]
-
blk.43.ffn_gate.weightQ4_K[2560 6400]
-
blk.43.ffn_up.weightQ4_K[2560 6400]
-
blk.43.ffn_down.weightQ4_K[6400 2560]
-
blk.44.attn_norm.weightF32[2560]
-
blk.44.attn_q_b.weightQ4_K[768 3840]
-
blk.44.attn_q_a.weightQ4_K[2560 768]
-
blk.44.attn_kv_b.weightQ4_K[256 5120]
-
blk.44.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.44.attn_q_a_norm.weightF32[768]
-
blk.44.attn_kv_a_norm.weightF32[256]
-
blk.44.attn_output.weightQ4_K[2560 2560]
-
blk.44.ffn_norm.weightF32[2560]
-
blk.44.ffn_gate.weightQ4_K[2560 6400]
-
blk.44.ffn_up.weightQ4_K[2560 6400]
-
blk.44.ffn_down.weightQ4_K[6400 2560]
-
blk.45.attn_norm.weightF32[2560]
-
blk.45.attn_q_b.weightQ4_K[768 3840]
-
blk.45.attn_q_a.weightQ4_K[2560 768]
-
blk.45.attn_kv_b.weightQ4_K[256 5120]
-
blk.45.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.45.attn_q_a_norm.weightF32[768]
-
blk.45.attn_kv_a_norm.weightF32[256]
-
blk.45.attn_output.weightQ4_K[2560 2560]
-
blk.45.ffn_norm.weightF32[2560]
-
blk.45.ffn_gate.weightQ4_K[2560 6400]
-
blk.45.ffn_up.weightQ4_K[2560 6400]
-
blk.45.ffn_down.weightQ6_K[6400 2560]
-
blk.46.attn_norm.weightF32[2560]
-
blk.46.attn_q_b.weightQ4_K[768 3840]
-
blk.46.attn_q_a.weightQ4_K[2560 768]
-
blk.46.attn_kv_b.weightQ4_K[256 5120]
-
blk.46.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.46.attn_q_a_norm.weightF32[768]
-
blk.46.attn_kv_a_norm.weightF32[256]
-
blk.46.attn_output.weightQ4_K[2560 2560]
-
blk.46.ffn_norm.weightF32[2560]
-
blk.46.ffn_gate.weightQ4_K[2560 6400]
-
blk.46.ffn_up.weightQ4_K[2560 6400]
-
blk.46.ffn_down.weightQ4_K[6400 2560]
-
blk.47.attn_norm.weightF32[2560]
-
blk.47.attn_q_b.weightQ4_K[768 3840]
-
blk.47.attn_q_a.weightQ4_K[2560 768]
-
blk.47.attn_kv_b.weightQ4_K[256 5120]
-
blk.47.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.47.attn_q_a_norm.weightF32[768]
-
blk.47.attn_kv_a_norm.weightF32[256]
-
blk.47.attn_output.weightQ4_K[2560 2560]
-
blk.47.ffn_norm.weightF32[2560]
-
blk.47.ffn_gate.weightQ4_K[2560 6400]
-
blk.47.ffn_up.weightQ4_K[2560 6400]
-
blk.47.ffn_down.weightQ4_K[6400 2560]
-
blk.48.attn_norm.weightF32[2560]
-
blk.48.attn_q_b.weightQ4_K[768 3840]
-
blk.48.attn_q_a.weightQ4_K[2560 768]
-
blk.48.attn_kv_b.weightQ4_K[256 5120]
-
blk.48.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.48.attn_q_a_norm.weightF32[768]
-
blk.48.attn_kv_a_norm.weightF32[256]
-
blk.48.attn_output.weightQ4_K[2560 2560]
-
blk.48.ffn_norm.weightF32[2560]
-
blk.48.ffn_gate.weightQ4_K[2560 6400]
-
blk.48.ffn_up.weightQ4_K[2560 6400]
-
blk.48.ffn_down.weightQ6_K[6400 2560]
-
blk.49.attn_norm.weightF32[2560]
-
blk.49.attn_q_b.weightQ4_K[768 3840]
-
blk.49.attn_q_a.weightQ4_K[2560 768]
-
blk.49.attn_kv_b.weightQ4_K[256 5120]
-
blk.49.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.49.attn_q_a_norm.weightF32[768]
-
blk.49.attn_kv_a_norm.weightF32[256]
-
blk.49.attn_output.weightQ4_K[2560 2560]
-
blk.49.ffn_norm.weightF32[2560]
-
blk.49.ffn_gate.weightQ4_K[2560 6400]
-
blk.49.ffn_up.weightQ4_K[2560 6400]
-
blk.49.ffn_down.weightQ4_K[6400 2560]
-
blk.50.attn_norm.weightF32[2560]
-
blk.50.attn_q_b.weightQ4_K[768 3840]
-
blk.50.attn_q_a.weightQ4_K[2560 768]
-
blk.50.attn_kv_b.weightQ4_K[256 5120]
-
blk.50.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.50.attn_q_a_norm.weightF32[768]
-
blk.50.attn_kv_a_norm.weightF32[256]
-
blk.50.attn_output.weightQ4_K[2560 2560]
-
blk.50.ffn_norm.weightF32[2560]
-
blk.50.ffn_gate.weightQ4_K[2560 6400]
-
blk.50.ffn_up.weightQ4_K[2560 6400]
-
blk.50.ffn_down.weightQ4_K[6400 2560]
-
blk.51.attn_norm.weightF32[2560]
-
blk.51.attn_q_b.weightQ4_K[768 3840]
-
blk.51.attn_q_a.weightQ4_K[2560 768]
-
blk.51.attn_kv_b.weightQ4_K[256 5120]
-
blk.51.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.51.attn_q_a_norm.weightF32[768]
-
blk.51.attn_kv_a_norm.weightF32[256]
-
blk.51.attn_output.weightQ4_K[2560 2560]
-
blk.51.ffn_norm.weightF32[2560]
-
blk.51.ffn_gate.weightQ4_K[2560 6400]
-
blk.51.ffn_up.weightQ4_K[2560 6400]
-
blk.51.ffn_down.weightQ6_K[6400 2560]
-
blk.52.attn_norm.weightF32[2560]
-
blk.52.attn_q_b.weightQ4_K[768 3840]
-
blk.52.attn_q_a.weightQ4_K[2560 768]
-
blk.52.attn_kv_b.weightQ4_K[256 5120]
-
blk.52.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.52.attn_q_a_norm.weightF32[768]
-
blk.52.attn_kv_a_norm.weightF32[256]
-
blk.52.attn_output.weightQ4_K[2560 2560]
-
blk.52.ffn_norm.weightF32[2560]
-
blk.52.ffn_gate.weightQ4_K[2560 6400]
-
blk.52.ffn_up.weightQ4_K[2560 6400]
-
blk.52.ffn_down.weightQ4_K[6400 2560]
-
blk.53.attn_norm.weightF32[2560]
-
blk.53.attn_q_b.weightQ4_K[768 3840]
-
blk.53.attn_q_a.weightQ4_K[2560 768]
-
blk.53.attn_kv_b.weightQ4_K[256 5120]
-
blk.53.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.53.attn_q_a_norm.weightF32[768]
-
blk.53.attn_kv_a_norm.weightF32[256]
-
blk.53.attn_output.weightQ4_K[2560 2560]
-
blk.53.ffn_norm.weightF32[2560]
-
blk.53.ffn_gate.weightQ4_K[2560 6400]
-
blk.53.ffn_up.weightQ4_K[2560 6400]
-
blk.53.ffn_down.weightQ4_K[6400 2560]
-
blk.54.attn_norm.weightF32[2560]
-
blk.54.attn_q_b.weightQ4_K[768 3840]
-
blk.54.attn_q_a.weightQ4_K[2560 768]
-
blk.54.attn_kv_b.weightQ4_K[256 5120]
-
blk.54.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.54.attn_q_a_norm.weightF32[768]
-
blk.54.attn_kv_a_norm.weightF32[256]
-
blk.54.attn_output.weightQ4_K[2560 2560]
-
blk.54.ffn_norm.weightF32[2560]
-
blk.54.ffn_gate.weightQ4_K[2560 6400]
-
blk.54.ffn_up.weightQ4_K[2560 6400]
-
blk.54.ffn_down.weightQ6_K[6400 2560]
-
blk.55.attn_norm.weightF32[2560]
-
blk.55.attn_q_b.weightQ4_K[768 3840]
-
blk.55.attn_q_a.weightQ4_K[2560 768]
-
blk.55.attn_kv_b.weightQ4_K[256 5120]
-
blk.55.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.55.attn_q_a_norm.weightF32[768]
-
blk.55.attn_kv_a_norm.weightF32[256]
-
blk.55.attn_output.weightQ4_K[2560 2560]
-
blk.55.ffn_norm.weightF32[2560]
-
blk.55.ffn_gate.weightQ4_K[2560 6400]
-
blk.55.ffn_up.weightQ4_K[2560 6400]
-
blk.55.ffn_down.weightQ6_K[6400 2560]
-
blk.56.attn_norm.weightF32[2560]
-
blk.56.attn_q_b.weightQ4_K[768 3840]
-
blk.56.attn_q_a.weightQ4_K[2560 768]
-
blk.56.attn_kv_b.weightQ4_K[256 5120]
-
blk.56.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.56.attn_q_a_norm.weightF32[768]
-
blk.56.attn_kv_a_norm.weightF32[256]
-
blk.56.attn_output.weightQ4_K[2560 2560]
-
blk.56.ffn_norm.weightF32[2560]
-
blk.56.ffn_gate.weightQ4_K[2560 6400]
-
blk.56.ffn_up.weightQ4_K[2560 6400]
-
blk.56.ffn_down.weightQ6_K[6400 2560]
-
blk.57.attn_norm.weightF32[2560]
-
blk.57.attn_q_b.weightQ4_K[768 3840]
-
blk.57.attn_q_a.weightQ4_K[2560 768]
-
blk.57.attn_kv_b.weightQ4_K[256 5120]
-
blk.57.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.57.attn_q_a_norm.weightF32[768]
-
blk.57.attn_kv_a_norm.weightF32[256]
-
blk.57.attn_output.weightQ4_K[2560 2560]
-
blk.57.ffn_norm.weightF32[2560]
-
blk.57.ffn_gate.weightQ4_K[2560 6400]
-
blk.57.ffn_up.weightQ4_K[2560 6400]
-
blk.57.ffn_down.weightQ6_K[6400 2560]
-
blk.58.attn_norm.weightF32[2560]
-
blk.58.attn_q_b.weightQ4_K[768 3840]
-
blk.58.attn_q_a.weightQ4_K[2560 768]
-
blk.58.attn_kv_b.weightQ4_K[256 5120]
-
blk.58.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.58.attn_q_a_norm.weightF32[768]
-
blk.58.attn_kv_a_norm.weightF32[256]
-
blk.58.attn_output.weightQ4_K[2560 2560]
-
blk.58.ffn_norm.weightF32[2560]
-
blk.58.ffn_gate.weightQ4_K[2560 6400]
-
blk.58.ffn_up.weightQ4_K[2560 6400]
-
blk.58.ffn_down.weightQ6_K[6400 2560]
-
blk.59.attn_norm.weightF32[2560]
-
blk.59.attn_q_b.weightQ4_K[768 3840]
-
blk.59.attn_q_a.weightQ4_K[2560 768]
-
blk.59.attn_kv_b.weightQ4_K[256 5120]
-
blk.59.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.59.attn_q_a_norm.weightF32[768]
-
blk.59.attn_kv_a_norm.weightF32[256]
-
blk.59.attn_output.weightQ4_K[2560 2560]
-
blk.59.ffn_norm.weightF32[2560]
-
blk.59.ffn_gate.weightQ4_K[2560 6400]
-
blk.59.ffn_up.weightQ4_K[2560 6400]
-
blk.59.ffn_down.weightQ6_K[6400 2560]
-
blk.60.attn_norm.weightF32[2560]
-
blk.60.attn_q_b.weightQ4_K[768 3840]
-
blk.60.attn_q_a.weightQ4_K[2560 768]
-
blk.60.attn_kv_b.weightQ4_K[256 5120]
-
blk.60.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.60.attn_q_a_norm.weightF32[768]
-
blk.60.attn_kv_a_norm.weightF32[256]
-
blk.60.attn_output.weightQ4_K[2560 2560]
-
blk.60.ffn_norm.weightF32[2560]
-
blk.60.ffn_gate.weightQ4_K[2560 6400]
-
blk.60.ffn_up.weightQ4_K[2560 6400]
-
blk.60.ffn_down.weightQ6_K[6400 2560]
-
blk.61.attn_norm.weightF32[2560]
-
blk.61.attn_q_b.weightQ4_K[768 3840]
-
blk.61.attn_q_a.weightQ4_K[2560 768]
-
blk.61.attn_kv_b.weightQ4_K[256 5120]
-
blk.61.attn_kv_a_mqa.weightQ4_K[2560 288]
-
blk.61.attn_q_a_norm.weightF32[768]
-
blk.61.attn_kv_a_norm.weightF32[256]
-
blk.61.attn_output.weightQ4_K[2560 2560]
-
blk.61.ffn_norm.weightF32[2560]
-
blk.61.ffn_gate.weightQ4_K[2560 6400]
-
blk.61.ffn_up.weightQ4_K[2560 6400]
-
blk.61.ffn_down.weightQ6_K[6400 2560]
-
output_norm.weightF32[2560]
-
rope_factors_long.weightF32[16]
-
rope_factors_short.weightF32[16]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61