Mixtral_34Bx2_MoE_60B GGUF Q4_K_M
35 Pulls Updated 5 months ago
0ea4500fc0ad · 34GB
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count56
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count60
-
llama.context_length200000
-
llama.embedding_length7168
-
llama.expert_count2
-
llama.expert_used_count2
-
llama.feed_forward_length20480
-
llama.rope.dimension_count128
-
llama.rope.freq_base5e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.merges[`` ` ` `` -- > - -> -- - ...]
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id1
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <|Human|> <|Assistant|> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[7168 64000]
-
blk.0.ffn_up.0.weightQ4_K[7168 20480]
-
blk.0.ffn_up.1.weightQ4_K[7168 20480]
-
blk.0.attn_norm.weightF32[7168]
-
blk.0.ffn_down.0.weightQ4_K[20480 7168]
-
blk.0.ffn_down.1.weightQ4_K[20480 7168]
-
blk.0.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.0.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.0.ffn_norm.weightF32[7168]
-
blk.0.attn_q.weightQ4_K[7168 7168]
-
blk.0.attn_k.weightQ4_K[7168 1024]
-
blk.0.attn_output.weightQ4_K[7168 7168]
-
blk.0.attn_v.weightQ6_K[7168 1024]
-
blk.0.ffn_gate_inp.weightF16[7168 2]
-
blk.1.ffn_up.0.weightQ4_K[7168 20480]
-
blk.1.ffn_up.1.weightQ4_K[7168 20480]
-
blk.1.attn_norm.weightF32[7168]
-
blk.1.ffn_down.0.weightQ4_K[20480 7168]
-
blk.1.ffn_down.1.weightQ4_K[20480 7168]
-
blk.1.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.1.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.1.ffn_norm.weightF32[7168]
-
blk.1.attn_q.weightQ4_K[7168 7168]
-
blk.1.attn_k.weightQ4_K[7168 1024]
-
blk.1.attn_output.weightQ4_K[7168 7168]
-
blk.1.attn_v.weightQ6_K[7168 1024]
-
blk.1.ffn_gate_inp.weightF16[7168 2]
-
blk.2.ffn_up.0.weightQ4_K[7168 20480]
-
blk.2.ffn_up.1.weightQ4_K[7168 20480]
-
blk.2.attn_norm.weightF32[7168]
-
blk.2.ffn_down.0.weightQ4_K[20480 7168]
-
blk.2.ffn_down.1.weightQ4_K[20480 7168]
-
blk.2.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.2.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.2.ffn_norm.weightF32[7168]
-
blk.2.attn_q.weightQ4_K[7168 7168]
-
blk.2.attn_k.weightQ4_K[7168 1024]
-
blk.2.attn_output.weightQ4_K[7168 7168]
-
blk.2.attn_v.weightQ6_K[7168 1024]
-
blk.2.ffn_gate_inp.weightF16[7168 2]
-
blk.3.ffn_up.0.weightQ4_K[7168 20480]
-
blk.3.ffn_up.1.weightQ4_K[7168 20480]
-
blk.3.attn_norm.weightF32[7168]
-
blk.3.ffn_down.0.weightQ4_K[20480 7168]
-
blk.3.ffn_down.1.weightQ4_K[20480 7168]
-
blk.3.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.3.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.3.ffn_norm.weightF32[7168]
-
blk.3.attn_q.weightQ4_K[7168 7168]
-
blk.3.attn_k.weightQ4_K[7168 1024]
-
blk.3.attn_output.weightQ4_K[7168 7168]
-
blk.3.attn_v.weightQ4_K[7168 1024]
-
blk.3.ffn_gate_inp.weightF16[7168 2]
-
blk.4.ffn_up.0.weightQ4_K[7168 20480]
-
blk.4.ffn_up.1.weightQ4_K[7168 20480]
-
blk.4.attn_norm.weightF32[7168]
-
blk.4.ffn_down.0.weightQ4_K[20480 7168]
-
blk.4.ffn_down.1.weightQ4_K[20480 7168]
-
blk.4.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.4.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.4.ffn_norm.weightF32[7168]
-
blk.4.attn_q.weightQ4_K[7168 7168]
-
blk.4.attn_k.weightQ4_K[7168 1024]
-
blk.4.attn_output.weightQ4_K[7168 7168]
-
blk.4.attn_v.weightQ4_K[7168 1024]
-
blk.4.ffn_gate_inp.weightF16[7168 2]
-
blk.5.ffn_up.0.weightQ4_K[7168 20480]
-
blk.5.ffn_up.1.weightQ4_K[7168 20480]
-
blk.5.attn_norm.weightF32[7168]
-
blk.5.ffn_down.0.weightQ4_K[20480 7168]
-
blk.5.ffn_down.1.weightQ4_K[20480 7168]
-
blk.5.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.5.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.5.ffn_norm.weightF32[7168]
-
blk.5.attn_q.weightQ4_K[7168 7168]
-
blk.5.attn_k.weightQ4_K[7168 1024]
-
blk.5.attn_output.weightQ4_K[7168 7168]
-
blk.5.attn_v.weightQ6_K[7168 1024]
-
blk.5.ffn_gate_inp.weightF16[7168 2]
-
blk.6.ffn_up.0.weightQ4_K[7168 20480]
-
blk.6.ffn_up.1.weightQ4_K[7168 20480]
-
blk.6.attn_norm.weightF32[7168]
-
blk.6.ffn_down.0.weightQ4_K[20480 7168]
-
blk.6.ffn_down.1.weightQ4_K[20480 7168]
-
blk.6.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.6.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.6.ffn_norm.weightF32[7168]
-
blk.6.attn_q.weightQ4_K[7168 7168]
-
blk.6.attn_k.weightQ4_K[7168 1024]
-
blk.6.attn_output.weightQ4_K[7168 7168]
-
blk.6.attn_v.weightQ6_K[7168 1024]
-
blk.6.ffn_gate_inp.weightF16[7168 2]
-
blk.7.ffn_up.0.weightQ4_K[7168 20480]
-
blk.7.ffn_up.1.weightQ4_K[7168 20480]
-
blk.7.attn_norm.weightF32[7168]
-
blk.7.ffn_down.0.weightQ4_K[20480 7168]
-
blk.7.ffn_down.1.weightQ4_K[20480 7168]
-
blk.7.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.7.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.7.ffn_norm.weightF32[7168]
-
blk.7.attn_q.weightQ4_K[7168 7168]
-
blk.7.attn_k.weightQ4_K[7168 1024]
-
blk.7.attn_output.weightQ4_K[7168 7168]
-
blk.7.attn_v.weightQ6_K[7168 1024]
-
blk.7.ffn_gate_inp.weightF16[7168 2]
-
blk.8.ffn_up.0.weightQ4_K[7168 20480]
-
blk.8.ffn_up.1.weightQ4_K[7168 20480]
-
blk.8.attn_norm.weightF32[7168]
-
blk.8.ffn_down.0.weightQ4_K[20480 7168]
-
blk.8.ffn_down.1.weightQ4_K[20480 7168]
-
blk.8.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.8.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.8.ffn_norm.weightF32[7168]
-
blk.8.attn_q.weightQ4_K[7168 7168]
-
blk.8.attn_k.weightQ4_K[7168 1024]
-
blk.8.attn_output.weightQ4_K[7168 7168]
-
blk.8.attn_v.weightQ6_K[7168 1024]
-
blk.8.ffn_gate_inp.weightF16[7168 2]
-
blk.9.ffn_up.0.weightQ4_K[7168 20480]
-
blk.9.ffn_up.1.weightQ4_K[7168 20480]
-
blk.9.attn_norm.weightF32[7168]
-
blk.9.ffn_down.0.weightQ4_K[20480 7168]
-
blk.9.ffn_down.1.weightQ4_K[20480 7168]
-
blk.9.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.9.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.9.ffn_norm.weightF32[7168]
-
blk.9.attn_q.weightQ4_K[7168 7168]
-
blk.9.attn_k.weightQ4_K[7168 1024]
-
blk.9.attn_output.weightQ4_K[7168 7168]
-
blk.9.attn_v.weightQ6_K[7168 1024]
-
blk.9.ffn_gate_inp.weightF16[7168 2]
-
blk.10.ffn_up.0.weightQ4_K[7168 20480]
-
blk.10.ffn_up.1.weightQ4_K[7168 20480]
-
blk.10.attn_norm.weightF32[7168]
-
blk.10.ffn_down.0.weightQ4_K[20480 7168]
-
blk.10.ffn_down.1.weightQ4_K[20480 7168]
-
blk.10.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.10.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.10.ffn_norm.weightF32[7168]
-
blk.10.attn_q.weightQ4_K[7168 7168]
-
blk.10.attn_k.weightQ4_K[7168 1024]
-
blk.10.attn_output.weightQ4_K[7168 7168]
-
blk.10.attn_v.weightQ6_K[7168 1024]
-
blk.10.ffn_gate_inp.weightF16[7168 2]
-
blk.11.ffn_up.0.weightQ4_K[7168 20480]
-
blk.11.ffn_up.1.weightQ4_K[7168 20480]
-
blk.11.attn_norm.weightF32[7168]
-
blk.11.ffn_down.0.weightQ4_K[20480 7168]
-
blk.11.ffn_down.1.weightQ4_K[20480 7168]
-
blk.11.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.11.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.11.ffn_norm.weightF32[7168]
-
blk.11.attn_q.weightQ4_K[7168 7168]
-
blk.11.attn_k.weightQ4_K[7168 1024]
-
blk.11.attn_output.weightQ4_K[7168 7168]
-
blk.11.attn_v.weightQ6_K[7168 1024]
-
blk.11.ffn_gate_inp.weightF16[7168 2]
-
blk.12.ffn_up.0.weightQ4_K[7168 20480]
-
blk.12.ffn_up.1.weightQ4_K[7168 20480]
-
blk.12.attn_norm.weightF32[7168]
-
blk.12.ffn_down.0.weightQ4_K[20480 7168]
-
blk.12.ffn_down.1.weightQ4_K[20480 7168]
-
blk.12.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.12.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.12.ffn_norm.weightF32[7168]
-
blk.12.attn_q.weightQ4_K[7168 7168]
-
blk.12.attn_k.weightQ4_K[7168 1024]
-
blk.12.attn_output.weightQ4_K[7168 7168]
-
blk.12.attn_v.weightQ6_K[7168 1024]
-
blk.12.ffn_gate_inp.weightF16[7168 2]
-
blk.13.ffn_up.0.weightQ4_K[7168 20480]
-
blk.13.attn_norm.weightF32[7168]
-
blk.13.ffn_up.1.weightQ4_K[7168 20480]
-
blk.13.ffn_down.0.weightQ4_K[20480 7168]
-
blk.13.ffn_down.1.weightQ4_K[20480 7168]
-
blk.13.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.13.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.13.ffn_norm.weightF32[7168]
-
blk.13.attn_q.weightQ4_K[7168 7168]
-
blk.13.attn_k.weightQ4_K[7168 1024]
-
blk.13.attn_output.weightQ4_K[7168 7168]
-
blk.13.attn_v.weightQ6_K[7168 1024]
-
blk.13.ffn_gate_inp.weightF16[7168 2]
-
blk.14.attn_norm.weightF32[7168]
-
blk.14.ffn_up.0.weightQ4_K[7168 20480]
-
blk.14.ffn_up.1.weightQ4_K[7168 20480]
-
blk.14.ffn_down.0.weightQ4_K[20480 7168]
-
blk.14.ffn_down.1.weightQ4_K[20480 7168]
-
blk.14.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.14.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.14.ffn_norm.weightF32[7168]
-
blk.14.attn_q.weightQ4_K[7168 7168]
-
blk.14.attn_k.weightQ4_K[7168 1024]
-
blk.14.attn_output.weightQ4_K[7168 7168]
-
blk.14.attn_v.weightQ6_K[7168 1024]
-
blk.14.ffn_gate_inp.weightF16[7168 2]
-
blk.15.attn_norm.weightF32[7168]
-
blk.15.ffn_up.0.weightQ4_K[7168 20480]
-
blk.15.ffn_up.1.weightQ4_K[7168 20480]
-
blk.15.ffn_down.0.weightQ4_K[20480 7168]
-
blk.15.ffn_down.1.weightQ4_K[20480 7168]
-
blk.15.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.15.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.15.ffn_norm.weightF32[7168]
-
blk.15.attn_q.weightQ4_K[7168 7168]
-
blk.15.attn_k.weightQ4_K[7168 1024]
-
blk.15.attn_output.weightQ4_K[7168 7168]
-
blk.15.attn_v.weightQ4_K[7168 1024]
-
blk.15.ffn_gate_inp.weightF16[7168 2]
-
blk.16.attn_norm.weightF32[7168]
-
blk.16.ffn_up.0.weightQ4_K[7168 20480]
-
blk.16.ffn_up.1.weightQ4_K[7168 20480]
-
blk.16.ffn_down.0.weightQ4_K[20480 7168]
-
blk.16.ffn_down.1.weightQ4_K[20480 7168]
-
blk.16.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.16.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.16.ffn_norm.weightF32[7168]
-
blk.16.attn_q.weightQ4_K[7168 7168]
-
blk.16.attn_k.weightQ4_K[7168 1024]
-
blk.16.attn_output.weightQ4_K[7168 7168]
-
blk.16.attn_v.weightQ4_K[7168 1024]
-
blk.16.ffn_gate_inp.weightF16[7168 2]
-
blk.17.attn_norm.weightF32[7168]
-
blk.17.ffn_up.0.weightQ4_K[7168 20480]
-
blk.17.ffn_up.1.weightQ4_K[7168 20480]
-
blk.17.ffn_down.0.weightQ4_K[20480 7168]
-
blk.17.ffn_down.1.weightQ4_K[20480 7168]
-
blk.17.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.17.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.17.ffn_norm.weightF32[7168]
-
blk.17.attn_q.weightQ4_K[7168 7168]
-
blk.17.attn_k.weightQ4_K[7168 1024]
-
blk.17.attn_output.weightQ4_K[7168 7168]
-
blk.17.attn_v.weightQ6_K[7168 1024]
-
blk.17.ffn_gate_inp.weightF16[7168 2]
-
blk.18.attn_norm.weightF32[7168]
-
blk.18.ffn_up.0.weightQ4_K[7168 20480]
-
blk.18.ffn_up.1.weightQ4_K[7168 20480]
-
blk.18.ffn_down.0.weightQ4_K[20480 7168]
-
blk.18.ffn_down.1.weightQ4_K[20480 7168]
-
blk.18.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.18.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.18.ffn_norm.weightF32[7168]
-
blk.18.attn_q.weightQ4_K[7168 7168]
-
blk.18.attn_k.weightQ4_K[7168 1024]
-
blk.18.attn_output.weightQ4_K[7168 7168]
-
blk.18.attn_v.weightQ4_K[7168 1024]
-
blk.18.ffn_gate_inp.weightF16[7168 2]
-
blk.19.attn_norm.weightF32[7168]
-
blk.19.ffn_up.0.weightQ4_K[7168 20480]
-
blk.19.ffn_up.1.weightQ4_K[7168 20480]
-
blk.19.ffn_down.0.weightQ4_K[20480 7168]
-
blk.19.ffn_down.1.weightQ4_K[20480 7168]
-
blk.19.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.19.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.19.ffn_norm.weightF32[7168]
-
blk.19.attn_q.weightQ4_K[7168 7168]
-
blk.19.attn_k.weightQ4_K[7168 1024]
-
blk.19.attn_output.weightQ4_K[7168 7168]
-
blk.19.attn_v.weightQ4_K[7168 1024]
-
blk.19.ffn_gate_inp.weightF16[7168 2]
-
blk.20.attn_norm.weightF32[7168]
-
blk.20.ffn_up.0.weightQ4_K[7168 20480]
-
blk.20.ffn_up.1.weightQ4_K[7168 20480]
-
blk.20.ffn_down.0.weightQ4_K[20480 7168]
-
blk.20.ffn_down.1.weightQ4_K[20480 7168]
-
blk.20.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.20.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.20.ffn_norm.weightF32[7168]
-
blk.20.attn_k.weightQ4_K[7168 1024]
-
blk.20.attn_output.weightQ4_K[7168 7168]
-
blk.20.attn_q.weightQ4_K[7168 7168]
-
blk.20.attn_v.weightQ4_K[7168 1024]
-
blk.20.ffn_gate_inp.weightF16[7168 2]
-
blk.21.attn_norm.weightF32[7168]
-
blk.21.ffn_up.0.weightQ4_K[7168 20480]
-
blk.21.ffn_up.1.weightQ4_K[7168 20480]
-
blk.21.ffn_down.0.weightQ4_K[20480 7168]
-
blk.21.ffn_down.1.weightQ4_K[20480 7168]
-
blk.21.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.21.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.21.ffn_norm.weightF32[7168]
-
blk.21.attn_k.weightQ4_K[7168 1024]
-
blk.21.attn_output.weightQ4_K[7168 7168]
-
blk.21.attn_q.weightQ4_K[7168 7168]
-
blk.21.attn_v.weightQ4_K[7168 1024]
-
blk.21.ffn_gate_inp.weightF16[7168 2]
-
blk.22.attn_norm.weightF32[7168]
-
blk.22.ffn_up.0.weightQ4_K[7168 20480]
-
blk.22.ffn_up.1.weightQ4_K[7168 20480]
-
blk.22.ffn_down.0.weightQ4_K[20480 7168]
-
blk.22.ffn_down.1.weightQ4_K[20480 7168]
-
blk.22.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.22.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.22.ffn_norm.weightF32[7168]
-
blk.22.attn_k.weightQ4_K[7168 1024]
-
blk.22.attn_output.weightQ4_K[7168 7168]
-
blk.22.attn_q.weightQ4_K[7168 7168]
-
blk.22.attn_v.weightQ6_K[7168 1024]
-
blk.22.ffn_gate_inp.weightF16[7168 2]
-
blk.23.attn_norm.weightF32[7168]
-
blk.23.ffn_up.0.weightQ4_K[7168 20480]
-
blk.23.ffn_up.1.weightQ4_K[7168 20480]
-
blk.23.ffn_down.0.weightQ4_K[20480 7168]
-
blk.23.ffn_down.1.weightQ4_K[20480 7168]
-
blk.23.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.23.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.23.ffn_norm.weightF32[7168]
-
blk.23.attn_k.weightQ4_K[7168 1024]
-
blk.23.attn_output.weightQ4_K[7168 7168]
-
blk.23.attn_q.weightQ4_K[7168 7168]
-
blk.23.attn_v.weightQ4_K[7168 1024]
-
blk.23.ffn_gate_inp.weightF16[7168 2]
-
blk.24.attn_norm.weightF32[7168]
-
blk.24.ffn_up.0.weightQ4_K[7168 20480]
-
blk.24.ffn_up.1.weightQ4_K[7168 20480]
-
blk.24.ffn_down.0.weightQ4_K[20480 7168]
-
blk.24.ffn_down.1.weightQ4_K[20480 7168]
-
blk.24.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.24.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.24.ffn_norm.weightF32[7168]
-
blk.24.attn_k.weightQ4_K[7168 1024]
-
blk.24.attn_output.weightQ4_K[7168 7168]
-
blk.24.attn_q.weightQ4_K[7168 7168]
-
blk.24.attn_v.weightQ4_K[7168 1024]
-
blk.24.ffn_gate_inp.weightF16[7168 2]
-
blk.25.attn_norm.weightF32[7168]
-
blk.25.ffn_up.0.weightQ4_K[7168 20480]
-
blk.25.ffn_up.1.weightQ4_K[7168 20480]
-
blk.25.ffn_down.0.weightQ4_K[20480 7168]
-
blk.25.ffn_down.1.weightQ4_K[20480 7168]
-
blk.25.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.25.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.25.ffn_norm.weightF32[7168]
-
blk.25.attn_k.weightQ4_K[7168 1024]
-
blk.25.attn_output.weightQ4_K[7168 7168]
-
blk.25.attn_q.weightQ4_K[7168 7168]
-
blk.25.attn_v.weightQ6_K[7168 1024]
-
blk.25.ffn_gate_inp.weightF16[7168 2]
-
blk.26.attn_norm.weightF32[7168]
-
blk.26.ffn_up.0.weightQ4_K[7168 20480]
-
blk.26.ffn_up.1.weightQ4_K[7168 20480]
-
blk.26.ffn_down.0.weightQ4_K[20480 7168]
-
blk.26.ffn_down.1.weightQ4_K[20480 7168]
-
blk.26.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.26.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.26.ffn_norm.weightF32[7168]
-
blk.26.attn_k.weightQ4_K[7168 1024]
-
blk.26.attn_output.weightQ4_K[7168 7168]
-
blk.26.attn_q.weightQ4_K[7168 7168]
-
blk.26.attn_v.weightQ4_K[7168 1024]
-
blk.26.ffn_gate_inp.weightF16[7168 2]
-
blk.27.attn_norm.weightF32[7168]
-
blk.27.ffn_up.0.weightQ4_K[7168 20480]
-
blk.27.ffn_up.1.weightQ4_K[7168 20480]
-
blk.27.ffn_down.0.weightQ4_K[20480 7168]
-
blk.27.ffn_down.1.weightQ4_K[20480 7168]
-
blk.27.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.27.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.27.ffn_norm.weightF32[7168]
-
blk.27.attn_k.weightQ4_K[7168 1024]
-
blk.27.attn_output.weightQ4_K[7168 7168]
-
blk.27.attn_q.weightQ4_K[7168 7168]
-
blk.27.attn_v.weightQ4_K[7168 1024]
-
blk.27.ffn_gate_inp.weightF16[7168 2]
-
blk.28.attn_norm.weightF32[7168]
-
blk.28.ffn_up.0.weightQ4_K[7168 20480]
-
blk.28.ffn_up.1.weightQ4_K[7168 20480]
-
blk.28.ffn_down.0.weightQ4_K[20480 7168]
-
blk.28.ffn_down.1.weightQ4_K[20480 7168]
-
blk.28.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.28.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.28.ffn_norm.weightF32[7168]
-
blk.28.attn_k.weightQ4_K[7168 1024]
-
blk.28.attn_output.weightQ4_K[7168 7168]
-
blk.28.attn_q.weightQ4_K[7168 7168]
-
blk.28.attn_v.weightQ6_K[7168 1024]
-
blk.28.ffn_gate_inp.weightF16[7168 2]
-
blk.29.attn_norm.weightF32[7168]
-
blk.29.ffn_up.0.weightQ4_K[7168 20480]
-
blk.29.ffn_up.1.weightQ4_K[7168 20480]
-
blk.29.ffn_down.0.weightQ4_K[20480 7168]
-
blk.29.ffn_down.1.weightQ4_K[20480 7168]
-
blk.29.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.29.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.29.ffn_norm.weightF32[7168]
-
blk.29.attn_k.weightQ4_K[7168 1024]
-
blk.29.attn_output.weightQ4_K[7168 7168]
-
blk.29.attn_q.weightQ4_K[7168 7168]
-
blk.29.attn_v.weightQ4_K[7168 1024]
-
blk.29.ffn_gate_inp.weightF16[7168 2]
-
blk.30.attn_norm.weightF32[7168]
-
blk.30.ffn_up.0.weightQ4_K[7168 20480]
-
blk.30.ffn_up.1.weightQ4_K[7168 20480]
-
blk.30.ffn_down.0.weightQ4_K[20480 7168]
-
blk.30.ffn_down.1.weightQ4_K[20480 7168]
-
blk.30.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.30.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.30.ffn_norm.weightF32[7168]
-
blk.30.attn_k.weightQ4_K[7168 1024]
-
blk.30.attn_output.weightQ4_K[7168 7168]
-
blk.30.attn_q.weightQ4_K[7168 7168]
-
blk.30.attn_v.weightQ6_K[7168 1024]
-
blk.30.ffn_gate_inp.weightF16[7168 2]
-
blk.31.attn_norm.weightF32[7168]
-
blk.31.ffn_up.0.weightQ4_K[7168 20480]
-
blk.31.ffn_up.1.weightQ4_K[7168 20480]
-
blk.31.ffn_down.0.weightQ4_K[20480 7168]
-
blk.31.ffn_down.1.weightQ4_K[20480 7168]
-
blk.31.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.31.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.31.ffn_norm.weightF32[7168]
-
blk.31.attn_k.weightQ4_K[7168 1024]
-
blk.31.attn_output.weightQ4_K[7168 7168]
-
blk.31.attn_q.weightQ4_K[7168 7168]
-
blk.31.attn_v.weightQ4_K[7168 1024]
-
blk.31.ffn_gate_inp.weightF16[7168 2]
-
blk.32.attn_norm.weightF32[7168]
-
blk.32.ffn_up.0.weightQ4_K[7168 20480]
-
blk.32.ffn_up.1.weightQ4_K[7168 20480]
-
blk.32.ffn_down.0.weightQ4_K[20480 7168]
-
blk.32.ffn_down.1.weightQ4_K[20480 7168]
-
blk.32.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.32.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.32.ffn_norm.weightF32[7168]
-
blk.32.attn_k.weightQ4_K[7168 1024]
-
blk.32.attn_output.weightQ4_K[7168 7168]
-
blk.32.attn_q.weightQ4_K[7168 7168]
-
blk.32.attn_v.weightQ4_K[7168 1024]
-
blk.32.ffn_gate_inp.weightF16[7168 2]
-
blk.33.attn_norm.weightF32[7168]
-
blk.33.ffn_up.0.weightQ4_K[7168 20480]
-
blk.33.ffn_up.1.weightQ4_K[7168 20480]
-
blk.33.ffn_down.0.weightQ4_K[20480 7168]
-
blk.33.ffn_down.1.weightQ4_K[20480 7168]
-
blk.33.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.33.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.33.ffn_norm.weightF32[7168]
-
blk.33.attn_k.weightQ4_K[7168 1024]
-
blk.33.attn_output.weightQ4_K[7168 7168]
-
blk.33.attn_q.weightQ4_K[7168 7168]
-
blk.33.attn_v.weightQ6_K[7168 1024]
-
blk.33.ffn_gate_inp.weightF16[7168 2]
-
blk.34.attn_norm.weightF32[7168]
-
blk.34.ffn_up.0.weightQ4_K[7168 20480]
-
blk.34.ffn_up.1.weightQ4_K[7168 20480]
-
blk.34.ffn_down.0.weightQ4_K[20480 7168]
-
blk.34.ffn_down.1.weightQ4_K[20480 7168]
-
blk.34.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.34.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.34.ffn_norm.weightF32[7168]
-
blk.34.attn_k.weightQ4_K[7168 1024]
-
blk.34.attn_output.weightQ4_K[7168 7168]
-
blk.34.attn_q.weightQ4_K[7168 7168]
-
blk.34.attn_v.weightQ4_K[7168 1024]
-
blk.34.ffn_gate_inp.weightF16[7168 2]
-
blk.35.attn_norm.weightF32[7168]
-
blk.35.ffn_up.0.weightQ4_K[7168 20480]
-
blk.35.ffn_up.1.weightQ4_K[7168 20480]
-
blk.35.ffn_down.0.weightQ4_K[20480 7168]
-
blk.35.ffn_down.1.weightQ4_K[20480 7168]
-
blk.35.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.35.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.35.ffn_norm.weightF32[7168]
-
blk.35.attn_k.weightQ4_K[7168 1024]
-
blk.35.attn_output.weightQ4_K[7168 7168]
-
blk.35.attn_q.weightQ4_K[7168 7168]
-
blk.35.attn_v.weightQ4_K[7168 1024]
-
blk.35.ffn_gate_inp.weightF16[7168 2]
-
blk.36.attn_norm.weightF32[7168]
-
blk.36.ffn_up.0.weightQ4_K[7168 20480]
-
blk.36.ffn_up.1.weightQ4_K[7168 20480]
-
blk.36.ffn_down.0.weightQ4_K[20480 7168]
-
blk.36.ffn_down.1.weightQ4_K[20480 7168]
-
blk.36.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.36.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.36.ffn_norm.weightF32[7168]
-
blk.36.attn_k.weightQ4_K[7168 1024]
-
blk.36.attn_output.weightQ4_K[7168 7168]
-
blk.36.attn_q.weightQ4_K[7168 7168]
-
blk.36.attn_v.weightQ6_K[7168 1024]
-
blk.36.ffn_gate_inp.weightF16[7168 2]
-
blk.37.attn_norm.weightF32[7168]
-
blk.37.ffn_up.0.weightQ4_K[7168 20480]
-
blk.37.ffn_up.1.weightQ4_K[7168 20480]
-
blk.37.ffn_down.0.weightQ4_K[20480 7168]
-
blk.37.ffn_down.1.weightQ4_K[20480 7168]
-
blk.37.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.37.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.37.ffn_norm.weightF32[7168]
-
blk.37.attn_k.weightQ4_K[7168 1024]
-
blk.37.attn_output.weightQ4_K[7168 7168]
-
blk.37.attn_q.weightQ4_K[7168 7168]
-
blk.37.attn_v.weightQ4_K[7168 1024]
-
blk.37.ffn_gate_inp.weightF16[7168 2]
-
blk.38.attn_norm.weightF32[7168]
-
blk.38.ffn_up.0.weightQ4_K[7168 20480]
-
blk.38.ffn_up.1.weightQ4_K[7168 20480]
-
blk.38.ffn_down.0.weightQ4_K[20480 7168]
-
blk.38.ffn_down.1.weightQ4_K[20480 7168]
-
blk.38.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.38.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.38.ffn_norm.weightF32[7168]
-
blk.38.attn_k.weightQ4_K[7168 1024]
-
blk.38.attn_output.weightQ4_K[7168 7168]
-
blk.38.attn_q.weightQ4_K[7168 7168]
-
blk.38.attn_v.weightQ4_K[7168 1024]
-
blk.38.ffn_gate_inp.weightF16[7168 2]
-
blk.39.attn_norm.weightF32[7168]
-
blk.39.ffn_up.0.weightQ4_K[7168 20480]
-
blk.39.ffn_up.1.weightQ4_K[7168 20480]
-
blk.39.ffn_down.0.weightQ4_K[20480 7168]
-
blk.39.ffn_down.1.weightQ4_K[20480 7168]
-
blk.39.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.39.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.39.ffn_norm.weightF32[7168]
-
blk.39.attn_k.weightQ4_K[7168 1024]
-
blk.39.attn_output.weightQ4_K[7168 7168]
-
blk.39.attn_q.weightQ4_K[7168 7168]
-
blk.39.attn_v.weightQ6_K[7168 1024]
-
blk.39.ffn_gate_inp.weightF16[7168 2]
-
blk.40.attn_norm.weightF32[7168]
-
blk.40.ffn_up.0.weightQ4_K[7168 20480]
-
blk.40.ffn_up.1.weightQ4_K[7168 20480]
-
blk.40.ffn_down.0.weightQ4_K[20480 7168]
-
blk.40.ffn_down.1.weightQ4_K[20480 7168]
-
blk.40.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.40.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.40.ffn_norm.weightF32[7168]
-
blk.40.attn_k.weightQ4_K[7168 1024]
-
blk.40.attn_q.weightQ4_K[7168 7168]
-
blk.40.attn_v.weightQ4_K[7168 1024]
-
blk.40.ffn_gate_inp.weightF16[7168 2]
-
blk.40.attn_output.weightQ4_K[7168 7168]
-
blk.41.attn_norm.weightF32[7168]
-
blk.41.ffn_up.0.weightQ4_K[7168 20480]
-
blk.41.ffn_up.1.weightQ4_K[7168 20480]
-
blk.41.ffn_down.0.weightQ4_K[20480 7168]
-
blk.41.ffn_down.1.weightQ4_K[20480 7168]
-
blk.41.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.41.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.41.ffn_norm.weightF32[7168]
-
blk.41.attn_k.weightQ4_K[7168 1024]
-
blk.41.attn_q.weightQ4_K[7168 7168]
-
blk.41.attn_v.weightQ6_K[7168 1024]
-
blk.41.ffn_gate_inp.weightF16[7168 2]
-
blk.41.attn_output.weightQ4_K[7168 7168]
-
blk.42.attn_norm.weightF32[7168]
-
blk.42.ffn_up.0.weightQ4_K[7168 20480]
-
blk.42.ffn_up.1.weightQ4_K[7168 20480]
-
blk.42.ffn_down.0.weightQ4_K[20480 7168]
-
blk.42.ffn_down.1.weightQ4_K[20480 7168]
-
blk.42.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.42.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.42.ffn_norm.weightF32[7168]
-
blk.42.attn_k.weightQ4_K[7168 1024]
-
blk.42.attn_q.weightQ4_K[7168 7168]
-
blk.42.attn_v.weightQ4_K[7168 1024]
-
blk.42.ffn_gate_inp.weightF16[7168 2]
-
blk.42.attn_output.weightQ4_K[7168 7168]
-
blk.43.attn_norm.weightF32[7168]
-
blk.43.ffn_up.0.weightQ4_K[7168 20480]
-
blk.43.ffn_up.1.weightQ4_K[7168 20480]
-
blk.43.ffn_down.0.weightQ4_K[20480 7168]
-
blk.43.ffn_down.1.weightQ4_K[20480 7168]
-
blk.43.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.43.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.43.ffn_norm.weightF32[7168]
-
blk.43.attn_k.weightQ4_K[7168 1024]
-
blk.43.attn_q.weightQ4_K[7168 7168]
-
blk.43.attn_v.weightQ4_K[7168 1024]
-
blk.43.ffn_gate_inp.weightF16[7168 2]
-
blk.43.attn_output.weightQ4_K[7168 7168]
-
blk.44.attn_norm.weightF32[7168]
-
blk.44.ffn_up.0.weightQ4_K[7168 20480]
-
blk.44.ffn_up.1.weightQ4_K[7168 20480]
-
blk.44.ffn_down.0.weightQ4_K[20480 7168]
-
blk.44.ffn_down.1.weightQ4_K[20480 7168]
-
blk.44.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.44.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.44.ffn_norm.weightF32[7168]
-
blk.44.attn_k.weightQ4_K[7168 1024]
-
blk.44.attn_q.weightQ4_K[7168 7168]
-
blk.44.attn_v.weightQ6_K[7168 1024]
-
blk.44.ffn_gate_inp.weightF16[7168 2]
-
blk.44.attn_output.weightQ4_K[7168 7168]
-
blk.45.attn_norm.weightF32[7168]
-
blk.45.ffn_up.0.weightQ4_K[7168 20480]
-
blk.45.ffn_up.1.weightQ4_K[7168 20480]
-
blk.45.ffn_down.0.weightQ4_K[20480 7168]
-
blk.45.ffn_down.1.weightQ4_K[20480 7168]
-
blk.45.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.45.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.45.ffn_norm.weightF32[7168]
-
blk.45.attn_k.weightQ4_K[7168 1024]
-
blk.45.attn_q.weightQ4_K[7168 7168]
-
blk.45.attn_v.weightQ4_K[7168 1024]
-
blk.45.ffn_gate_inp.weightF16[7168 2]
-
blk.45.attn_output.weightQ4_K[7168 7168]
-
blk.46.attn_norm.weightF32[7168]
-
blk.46.ffn_up.0.weightQ4_K[7168 20480]
-
blk.46.ffn_up.1.weightQ4_K[7168 20480]
-
blk.46.ffn_down.0.weightQ4_K[20480 7168]
-
blk.46.ffn_down.1.weightQ4_K[20480 7168]
-
blk.46.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.46.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.46.ffn_norm.weightF32[7168]
-
blk.46.attn_k.weightQ4_K[7168 1024]
-
blk.46.attn_q.weightQ4_K[7168 7168]
-
blk.46.attn_v.weightQ4_K[7168 1024]
-
blk.46.ffn_gate_inp.weightF16[7168 2]
-
blk.46.attn_output.weightQ4_K[7168 7168]
-
blk.47.attn_norm.weightF32[7168]
-
blk.47.ffn_up.0.weightQ4_K[7168 20480]
-
blk.47.ffn_up.1.weightQ4_K[7168 20480]
-
blk.47.ffn_down.0.weightQ4_K[20480 7168]
-
blk.47.ffn_down.1.weightQ4_K[20480 7168]
-
blk.47.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.47.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.47.ffn_norm.weightF32[7168]
-
blk.47.attn_k.weightQ4_K[7168 1024]
-
blk.47.attn_q.weightQ4_K[7168 7168]
-
blk.47.attn_v.weightQ6_K[7168 1024]
-
blk.47.ffn_gate_inp.weightF16[7168 2]
-
blk.47.attn_output.weightQ4_K[7168 7168]
-
blk.48.attn_norm.weightF32[7168]
-
blk.48.ffn_up.0.weightQ4_K[7168 20480]
-
blk.48.ffn_up.1.weightQ4_K[7168 20480]
-
blk.48.ffn_down.0.weightQ4_K[20480 7168]
-
blk.48.ffn_down.1.weightQ4_K[20480 7168]
-
blk.48.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.48.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.48.ffn_norm.weightF32[7168]
-
blk.48.attn_k.weightQ4_K[7168 1024]
-
blk.48.attn_q.weightQ4_K[7168 7168]
-
blk.48.attn_v.weightQ4_K[7168 1024]
-
blk.48.ffn_gate_inp.weightF16[7168 2]
-
blk.48.attn_output.weightQ4_K[7168 7168]
-
blk.49.attn_norm.weightF32[7168]
-
blk.49.ffn_up.0.weightQ4_K[7168 20480]
-
blk.49.ffn_up.1.weightQ4_K[7168 20480]
-
blk.49.ffn_down.0.weightQ4_K[20480 7168]
-
blk.49.ffn_down.1.weightQ4_K[20480 7168]
-
blk.49.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.49.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.49.ffn_norm.weightF32[7168]
-
blk.49.attn_k.weightQ4_K[7168 1024]
-
blk.49.attn_q.weightQ4_K[7168 7168]
-
blk.49.attn_v.weightQ4_K[7168 1024]
-
blk.49.ffn_gate_inp.weightF16[7168 2]
-
blk.49.attn_output.weightQ4_K[7168 7168]
-
blk.50.attn_norm.weightF32[7168]
-
blk.50.ffn_up.0.weightQ4_K[7168 20480]
-
blk.50.ffn_up.1.weightQ4_K[7168 20480]
-
blk.50.ffn_down.0.weightQ4_K[20480 7168]
-
blk.50.ffn_down.1.weightQ4_K[20480 7168]
-
blk.50.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.50.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.50.ffn_norm.weightF32[7168]
-
blk.50.attn_k.weightQ4_K[7168 1024]
-
blk.50.attn_q.weightQ4_K[7168 7168]
-
blk.50.attn_v.weightQ4_K[7168 1024]
-
blk.50.ffn_gate_inp.weightF16[7168 2]
-
blk.50.attn_output.weightQ4_K[7168 7168]
-
blk.51.attn_norm.weightF32[7168]
-
blk.51.ffn_up.0.weightQ4_K[7168 20480]
-
blk.51.ffn_up.1.weightQ4_K[7168 20480]
-
blk.51.ffn_down.0.weightQ4_K[20480 7168]
-
blk.51.ffn_down.1.weightQ4_K[20480 7168]
-
blk.51.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.51.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.51.ffn_norm.weightF32[7168]
-
blk.51.attn_k.weightQ4_K[7168 1024]
-
blk.51.attn_q.weightQ4_K[7168 7168]
-
blk.51.attn_v.weightQ4_K[7168 1024]
-
blk.51.ffn_gate_inp.weightF16[7168 2]
-
blk.51.attn_output.weightQ4_K[7168 7168]
-
blk.52.attn_norm.weightF32[7168]
-
blk.52.ffn_up.0.weightQ4_K[7168 20480]
-
blk.52.ffn_up.1.weightQ4_K[7168 20480]
-
blk.52.ffn_down.0.weightQ4_K[20480 7168]
-
blk.52.ffn_down.1.weightQ4_K[20480 7168]
-
blk.52.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.52.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.52.ffn_norm.weightF32[7168]
-
blk.52.attn_k.weightQ4_K[7168 1024]
-
blk.52.attn_q.weightQ4_K[7168 7168]
-
blk.52.attn_v.weightQ6_K[7168 1024]
-
blk.52.ffn_gate_inp.weightF16[7168 2]
-
blk.52.attn_output.weightQ4_K[7168 7168]
-
blk.53.attn_norm.weightF32[7168]
-
blk.53.ffn_up.0.weightQ4_K[7168 20480]
-
blk.53.ffn_up.1.weightQ4_K[7168 20480]
-
blk.53.ffn_down.0.weightQ4_K[20480 7168]
-
blk.53.ffn_down.1.weightQ4_K[20480 7168]
-
blk.53.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.53.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.53.ffn_norm.weightF32[7168]
-
blk.53.attn_k.weightQ4_K[7168 1024]
-
blk.53.attn_q.weightQ4_K[7168 7168]
-
blk.53.attn_v.weightQ4_K[7168 1024]
-
blk.53.ffn_gate_inp.weightF16[7168 2]
-
blk.53.attn_output.weightQ4_K[7168 7168]
-
blk.54.attn_norm.weightF32[7168]
-
blk.54.ffn_up.0.weightQ4_K[7168 20480]
-
blk.54.ffn_up.1.weightQ4_K[7168 20480]
-
blk.54.ffn_down.0.weightQ4_K[20480 7168]
-
blk.54.ffn_down.1.weightQ4_K[20480 7168]
-
blk.54.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.54.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.54.ffn_norm.weightF32[7168]
-
blk.54.attn_k.weightQ4_K[7168 1024]
-
blk.54.attn_q.weightQ4_K[7168 7168]
-
blk.54.attn_v.weightQ4_K[7168 1024]
-
blk.54.ffn_gate_inp.weightF16[7168 2]
-
blk.54.attn_output.weightQ4_K[7168 7168]
-
blk.55.attn_norm.weightF32[7168]
-
blk.55.ffn_up.0.weightQ4_K[7168 20480]
-
blk.55.ffn_up.1.weightQ4_K[7168 20480]
-
blk.55.ffn_down.0.weightQ4_K[20480 7168]
-
blk.55.ffn_down.1.weightQ4_K[20480 7168]
-
blk.55.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.55.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.55.ffn_norm.weightF32[7168]
-
blk.55.attn_k.weightQ4_K[7168 1024]
-
blk.55.attn_q.weightQ4_K[7168 7168]
-
blk.55.attn_v.weightQ6_K[7168 1024]
-
blk.55.ffn_gate_inp.weightF16[7168 2]
-
blk.55.attn_output.weightQ4_K[7168 7168]
-
blk.56.attn_norm.weightF32[7168]
-
blk.56.ffn_up.0.weightQ4_K[7168 20480]
-
blk.56.ffn_up.1.weightQ4_K[7168 20480]
-
blk.56.ffn_down.0.weightQ4_K[20480 7168]
-
blk.56.ffn_down.1.weightQ4_K[20480 7168]
-
blk.56.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.56.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.56.ffn_norm.weightF32[7168]
-
blk.56.attn_k.weightQ4_K[7168 1024]
-
blk.56.attn_q.weightQ4_K[7168 7168]
-
blk.56.attn_v.weightQ6_K[7168 1024]
-
blk.56.ffn_gate_inp.weightF16[7168 2]
-
blk.56.attn_output.weightQ4_K[7168 7168]
-
blk.57.attn_norm.weightF32[7168]
-
blk.57.ffn_up.0.weightQ4_K[7168 20480]
-
blk.57.ffn_up.1.weightQ4_K[7168 20480]
-
blk.57.ffn_down.0.weightQ4_K[20480 7168]
-
blk.57.ffn_down.1.weightQ4_K[20480 7168]
-
blk.57.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.57.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.57.ffn_norm.weightF32[7168]
-
blk.57.attn_k.weightQ4_K[7168 1024]
-
blk.57.attn_q.weightQ4_K[7168 7168]
-
blk.57.attn_v.weightQ6_K[7168 1024]
-
blk.57.ffn_gate_inp.weightF16[7168 2]
-
blk.57.attn_output.weightQ4_K[7168 7168]
-
blk.58.attn_norm.weightF32[7168]
-
blk.58.ffn_up.0.weightQ4_K[7168 20480]
-
blk.58.ffn_up.1.weightQ4_K[7168 20480]
-
blk.58.ffn_down.0.weightQ4_K[20480 7168]
-
blk.58.ffn_down.1.weightQ4_K[20480 7168]
-
blk.58.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.58.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.58.ffn_norm.weightF32[7168]
-
blk.58.attn_k.weightQ4_K[7168 1024]
-
blk.58.attn_q.weightQ4_K[7168 7168]
-
blk.58.attn_v.weightQ6_K[7168 1024]
-
blk.58.ffn_gate_inp.weightF16[7168 2]
-
blk.58.attn_output.weightQ4_K[7168 7168]
-
blk.59.attn_norm.weightF32[7168]
-
blk.59.ffn_up.0.weightQ4_K[7168 20480]
-
blk.59.ffn_up.1.weightQ4_K[7168 20480]
-
blk.59.ffn_down.0.weightQ4_K[20480 7168]
-
blk.59.ffn_down.1.weightQ4_K[20480 7168]
-
blk.59.ffn_gate.0.weightQ4_K[7168 20480]
-
blk.59.ffn_gate.1.weightQ4_K[7168 20480]
-
blk.59.ffn_norm.weightF32[7168]
-
blk.59.attn_k.weightQ4_K[7168 1024]
-
blk.59.attn_q.weightQ4_K[7168 7168]
-
blk.59.attn_v.weightQ6_K[7168 1024]
-
blk.59.ffn_gate_inp.weightF16[7168 2]
-
blk.59.attn_output.weightQ4_K[7168 7168]
-
output.weightQ6_K[7168 64000]
-
output_norm.weightF32[7168]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59