latest
40GB
Midnight-Miqu-70B-v1.5-GGUF Q4_K_S & Q4_K_M
70B
661 Pulls Updated 5 months ago
0ab2054889a9 · 42GB
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length32764
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[8192 32000]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ6_K[28672 8192]
-
blk.0.ffn_gate.weightQ4_K[8192 28672]
-
blk.0.ffn_up.weightQ4_K[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ4_K[8192 1024]
-
blk.0.attn_output.weightQ4_K[8192 8192]
-
blk.0.attn_q.weightQ4_K[8192 8192]
-
blk.0.attn_v.weightQ6_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ6_K[28672 8192]
-
blk.1.ffn_gate.weightQ4_K[8192 28672]
-
blk.1.ffn_up.weightQ4_K[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.weightQ4_K[8192 1024]
-
blk.1.attn_output.weightQ4_K[8192 8192]
-
blk.1.attn_q.weightQ4_K[8192 8192]
-
blk.1.attn_v.weightQ6_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ6_K[28672 8192]
-
blk.2.ffn_gate.weightQ4_K[8192 28672]
-
blk.2.ffn_up.weightQ4_K[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightQ4_K[8192 1024]
-
blk.2.attn_output.weightQ4_K[8192 8192]
-
blk.2.attn_q.weightQ4_K[8192 8192]
-
blk.2.attn_v.weightQ6_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ6_K[28672 8192]
-
blk.3.ffn_gate.weightQ4_K[8192 28672]
-
blk.3.ffn_up.weightQ4_K[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightQ4_K[8192 1024]
-
blk.3.attn_output.weightQ4_K[8192 8192]
-
blk.3.attn_q.weightQ4_K[8192 8192]
-
blk.3.attn_v.weightQ6_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ6_K[28672 8192]
-
blk.4.ffn_gate.weightQ4_K[8192 28672]
-
blk.4.ffn_up.weightQ4_K[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.weightQ4_K[8192 1024]
-
blk.4.attn_output.weightQ4_K[8192 8192]
-
blk.4.attn_q.weightQ4_K[8192 8192]
-
blk.4.attn_v.weightQ6_K[8192 1024]
-
blk.5.attn_k.weightQ4_K[8192 1024]
-
blk.5.attn_output.weightQ4_K[8192 8192]
-
blk.5.attn_q.weightQ4_K[8192 8192]
-
blk.5.attn_v.weightQ6_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ6_K[28672 8192]
-
blk.5.ffn_gate.weightQ4_K[8192 28672]
-
blk.5.ffn_up.weightQ4_K[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ6_K[28672 8192]
-
blk.6.ffn_gate.weightQ4_K[8192 28672]
-
blk.6.ffn_up.weightQ4_K[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.weightQ4_K[8192 1024]
-
blk.6.attn_output.weightQ4_K[8192 8192]
-
blk.6.attn_q.weightQ4_K[8192 8192]
-
blk.6.attn_v.weightQ6_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ6_K[28672 8192]
-
blk.7.ffn_gate.weightQ4_K[8192 28672]
-
blk.7.ffn_up.weightQ4_K[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.weightQ4_K[8192 1024]
-
blk.7.attn_output.weightQ4_K[8192 8192]
-
blk.7.attn_q.weightQ4_K[8192 8192]
-
blk.7.attn_v.weightQ6_K[8192 1024]
-
blk.8.attn_k.weightQ4_K[8192 1024]
-
blk.8.attn_q.weightQ4_K[8192 8192]
-
blk.8.attn_v.weightQ6_K[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ6_K[28672 8192]
-
blk.8.ffn_gate.weightQ4_K[8192 28672]
-
blk.8.ffn_up.weightQ4_K[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_output.weightQ4_K[8192 8192]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_K[28672 8192]
-
blk.9.ffn_gate.weightQ4_K[8192 28672]
-
blk.9.ffn_up.weightQ4_K[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ4_K[8192 1024]
-
blk.9.attn_output.weightQ4_K[8192 8192]
-
blk.9.attn_q.weightQ4_K[8192 8192]
-
blk.9.attn_v.weightQ5_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ6_K[28672 8192]
-
blk.10.ffn_gate.weightQ4_K[8192 28672]
-
blk.10.ffn_up.weightQ4_K[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightQ4_K[8192 1024]
-
blk.10.attn_output.weightQ4_K[8192 8192]
-
blk.10.attn_q.weightQ4_K[8192 8192]
-
blk.10.attn_v.weightQ6_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_K[28672 8192]
-
blk.11.ffn_gate.weightQ4_K[8192 28672]
-
blk.11.ffn_up.weightQ4_K[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightQ4_K[8192 1024]
-
blk.11.attn_output.weightQ4_K[8192 8192]
-
blk.11.attn_q.weightQ4_K[8192 8192]
-
blk.11.attn_v.weightQ5_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ6_K[28672 8192]
-
blk.12.ffn_gate.weightQ4_K[8192 28672]
-
blk.12.ffn_up.weightQ4_K[8192 28672]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.weightQ4_K[8192 1024]
-
blk.12.attn_output.weightQ4_K[8192 8192]
-
blk.12.attn_q.weightQ4_K[8192 8192]
-
blk.12.attn_v.weightQ6_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_K[28672 8192]
-
blk.13.ffn_gate.weightQ4_K[8192 28672]
-
blk.13.ffn_up.weightQ4_K[8192 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.weightQ4_K[8192 1024]
-
blk.13.attn_output.weightQ4_K[8192 8192]
-
blk.13.attn_q.weightQ4_K[8192 8192]
-
blk.13.attn_v.weightQ5_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_K[28672 8192]
-
blk.14.ffn_gate.weightQ4_K[8192 28672]
-
blk.14.ffn_up.weightQ4_K[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ4_K[8192 1024]
-
blk.14.attn_output.weightQ4_K[8192 8192]
-
blk.14.attn_q.weightQ4_K[8192 8192]
-
blk.14.attn_v.weightQ5_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ6_K[28672 8192]
-
blk.15.ffn_gate.weightQ4_K[8192 28672]
-
blk.15.ffn_up.weightQ4_K[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.weightQ4_K[8192 1024]
-
blk.15.attn_output.weightQ4_K[8192 8192]
-
blk.15.attn_q.weightQ4_K[8192 8192]
-
blk.15.attn_v.weightQ6_K[8192 1024]
-
blk.16.ffn_gate.weightQ4_K[8192 28672]
-
blk.16.attn_k.weightQ4_K[8192 1024]
-
blk.16.attn_output.weightQ4_K[8192 8192]
-
blk.16.attn_q.weightQ4_K[8192 8192]
-
blk.16.attn_v.weightQ5_K[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_K[28672 8192]
-
blk.16.ffn_up.weightQ4_K[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_K[28672 8192]
-
blk.17.ffn_gate.weightQ4_K[8192 28672]
-
blk.17.ffn_up.weightQ4_K[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightQ4_K[8192 1024]
-
blk.17.attn_output.weightQ4_K[8192 8192]
-
blk.17.attn_q.weightQ4_K[8192 8192]
-
blk.17.attn_v.weightQ6_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ6_K[28672 8192]
-
blk.18.ffn_gate.weightQ4_K[8192 28672]
-
blk.18.ffn_up.weightQ4_K[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.weightQ4_K[8192 1024]
-
blk.18.attn_output.weightQ4_K[8192 8192]
-
blk.18.attn_q.weightQ4_K[8192 8192]
-
blk.18.attn_v.weightQ5_K[8192 1024]
-
blk.19.attn_k.weightQ4_K[8192 1024]
-
blk.19.attn_output.weightQ4_K[8192 8192]
-
blk.19.attn_q.weightQ4_K[8192 8192]
-
blk.19.attn_v.weightQ5_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_K[28672 8192]
-
blk.19.ffn_gate.weightQ4_K[8192 28672]
-
blk.19.ffn_up.weightQ4_K[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_K[28672 8192]
-
blk.20.ffn_gate.weightQ4_K[8192 28672]
-
blk.20.ffn_up.weightQ4_K[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightQ4_K[8192 1024]
-
blk.20.attn_output.weightQ4_K[8192 8192]
-
blk.20.attn_q.weightQ4_K[8192 8192]
-
blk.20.attn_v.weightQ5_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ6_K[28672 8192]
-
blk.21.ffn_gate.weightQ4_K[8192 28672]
-
blk.21.ffn_up.weightQ4_K[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.weightQ4_K[8192 1024]
-
blk.21.attn_output.weightQ4_K[8192 8192]
-
blk.21.attn_q.weightQ4_K[8192 8192]
-
blk.21.attn_v.weightQ6_K[8192 1024]
-
blk.22.attn_k.weightQ4_K[8192 1024]
-
blk.22.attn_q.weightQ4_K[8192 8192]
-
blk.22.attn_v.weightQ5_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_K[28672 8192]
-
blk.22.ffn_gate.weightQ4_K[8192 28672]
-
blk.22.ffn_up.weightQ4_K[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_output.weightQ4_K[8192 8192]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ6_K[28672 8192]
-
blk.23.ffn_gate.weightQ4_K[8192 28672]
-
blk.23.ffn_up.weightQ4_K[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ4_K[8192 1024]
-
blk.23.attn_output.weightQ4_K[8192 8192]
-
blk.23.attn_q.weightQ4_K[8192 8192]
-
blk.23.attn_v.weightQ5_K[8192 1024]
-
blk.24.ffn_down.weightQ4_K[28672 8192]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_gate.weightQ4_K[8192 28672]
-
blk.24.ffn_up.weightQ4_K[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightQ4_K[8192 1024]
-
blk.24.attn_output.weightQ4_K[8192 8192]
-
blk.24.attn_q.weightQ4_K[8192 8192]
-
blk.24.attn_v.weightQ6_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_K[28672 8192]
-
blk.25.ffn_gate.weightQ4_K[8192 28672]
-
blk.25.ffn_up.weightQ4_K[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightQ4_K[8192 1024]
-
blk.25.attn_output.weightQ4_K[8192 8192]
-
blk.25.attn_q.weightQ4_K[8192 8192]
-
blk.25.attn_v.weightQ5_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_K[28672 8192]
-
blk.26.ffn_gate.weightQ4_K[8192 28672]
-
blk.26.ffn_up.weightQ4_K[8192 28672]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.weightQ4_K[8192 1024]
-
blk.26.attn_output.weightQ4_K[8192 8192]
-
blk.26.attn_q.weightQ4_K[8192 8192]
-
blk.26.attn_v.weightQ5_K[8192 1024]
-
blk.27.ffn_gate.weightQ4_K[8192 28672]
-
blk.27.ffn_up.weightQ4_K[8192 28672]
-
blk.27.attn_k.weightQ4_K[8192 1024]
-
blk.27.attn_output.weightQ4_K[8192 8192]
-
blk.27.attn_q.weightQ4_K[8192 8192]
-
blk.27.attn_v.weightQ6_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ6_K[28672 8192]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_K[28672 8192]
-
blk.28.ffn_gate.weightQ4_K[8192 28672]
-
blk.28.ffn_up.weightQ4_K[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ4_K[8192 1024]
-
blk.28.attn_output.weightQ4_K[8192 8192]
-
blk.28.attn_q.weightQ4_K[8192 8192]
-
blk.28.attn_v.weightQ5_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_K[28672 8192]
-
blk.29.ffn_gate.weightQ4_K[8192 28672]
-
blk.29.ffn_up.weightQ4_K[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.weightQ4_K[8192 1024]
-
blk.29.attn_output.weightQ4_K[8192 8192]
-
blk.29.attn_q.weightQ4_K[8192 8192]
-
blk.29.attn_v.weightQ6_K[8192 1024]
-
blk.30.ffn_gate.weightQ4_K[8192 28672]
-
blk.30.attn_k.weightQ4_K[8192 1024]
-
blk.30.attn_output.weightQ4_K[8192 8192]
-
blk.30.attn_q.weightQ4_K[8192 8192]
-
blk.30.attn_v.weightQ5_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ6_K[28672 8192]
-
blk.30.ffn_up.weightQ4_K[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_K[28672 8192]
-
blk.31.ffn_gate.weightQ4_K[8192 28672]
-
blk.31.ffn_up.weightQ4_K[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightQ4_K[8192 1024]
-
blk.31.attn_output.weightQ4_K[8192 8192]
-
blk.31.attn_q.weightQ4_K[8192 8192]
-
blk.31.attn_v.weightQ5_K[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_K[28672 8192]
-
blk.32.ffn_gate.weightQ4_K[8192 28672]
-
blk.32.ffn_up.weightQ4_K[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.weightQ4_K[8192 1024]
-
blk.32.attn_output.weightQ4_K[8192 8192]
-
blk.32.attn_q.weightQ4_K[8192 8192]
-
blk.32.attn_v.weightQ5_K[8192 1024]
-
blk.33.attn_k.weightQ4_K[8192 1024]
-
blk.33.attn_output.weightQ4_K[8192 8192]
-
blk.33.attn_q.weightQ4_K[8192 8192]
-
blk.33.attn_v.weightQ6_K[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_K[28672 8192]
-
blk.33.ffn_gate.weightQ4_K[8192 28672]
-
blk.33.ffn_up.weightQ4_K[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_K[28672 8192]
-
blk.34.ffn_gate.weightQ4_K[8192 28672]
-
blk.34.ffn_up.weightQ4_K[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightQ4_K[8192 1024]
-
blk.34.attn_output.weightQ4_K[8192 8192]
-
blk.34.attn_q.weightQ4_K[8192 8192]
-
blk.34.attn_v.weightQ5_K[8192 1024]
-
blk.35.ffn_down.weightQ6_K[28672 8192]
-
blk.35.ffn_gate.weightQ4_K[8192 28672]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_up.weightQ4_K[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.weightQ4_K[8192 1024]
-
blk.35.attn_output.weightQ4_K[8192 8192]
-
blk.35.attn_q.weightQ4_K[8192 8192]
-
blk.35.attn_v.weightQ6_K[8192 1024]
-
blk.36.attn_k.weightQ4_K[8192 1024]
-
blk.36.attn_q.weightQ4_K[8192 8192]
-
blk.36.attn_v.weightQ5_K[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ6_K[28672 8192]
-
blk.36.ffn_gate.weightQ4_K[8192 28672]
-
blk.36.ffn_up.weightQ4_K[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_output.weightQ4_K[8192 8192]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_K[28672 8192]
-
blk.37.ffn_gate.weightQ4_K[8192 28672]
-
blk.37.ffn_up.weightQ4_K[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightQ4_K[8192 1024]
-
blk.37.attn_output.weightQ4_K[8192 8192]
-
blk.37.attn_q.weightQ4_K[8192 8192]
-
blk.37.attn_v.weightQ5_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_K[28672 8192]
-
blk.38.ffn_gate.weightQ4_K[8192 28672]
-
blk.38.ffn_up.weightQ4_K[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightQ4_K[8192 1024]
-
blk.38.attn_output.weightQ4_K[8192 8192]
-
blk.38.attn_q.weightQ4_K[8192 8192]
-
blk.38.attn_v.weightQ5_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ6_K[28672 8192]
-
blk.39.ffn_gate.weightQ4_K[8192 28672]
-
blk.39.ffn_up.weightQ4_K[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ4_K[8192 1024]
-
blk.39.attn_output.weightQ4_K[8192 8192]
-
blk.39.attn_q.weightQ4_K[8192 8192]
-
blk.39.attn_v.weightQ5_K[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ4_K[28672 8192]
-
blk.40.ffn_gate.weightQ4_K[8192 28672]
-
blk.40.ffn_up.weightQ4_K[8192 28672]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.weightQ4_K[8192 1024]
-
blk.40.attn_output.weightQ4_K[8192 8192]
-
blk.40.attn_q.weightQ4_K[8192 8192]
-
blk.40.attn_v.weightQ5_K[8192 1024]
-
blk.41.ffn_gate.weightQ4_K[8192 28672]
-
blk.41.ffn_up.weightQ4_K[8192 28672]
-
blk.41.attn_k.weightQ4_K[8192 1024]
-
blk.41.attn_output.weightQ4_K[8192 8192]
-
blk.41.attn_v.weightQ6_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ4_K[28672 8192]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_q.weightQ4_K[8192 8192]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ6_K[28672 8192]
-
blk.42.ffn_gate.weightQ4_K[8192 28672]
-
blk.42.ffn_up.weightQ4_K[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightQ4_K[8192 1024]
-
blk.42.attn_output.weightQ4_K[8192 8192]
-
blk.42.attn_q.weightQ4_K[8192 8192]
-
blk.42.attn_v.weightQ6_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ4_K[28672 8192]
-
blk.43.ffn_gate.weightQ4_K[8192 28672]
-
blk.43.ffn_up.weightQ4_K[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.weightQ4_K[8192 1024]
-
blk.43.attn_output.weightQ4_K[8192 8192]
-
blk.43.attn_q.weightQ4_K[8192 8192]
-
blk.43.attn_v.weightQ5_K[8192 1024]
-
blk.44.ffn_gate.weightQ4_K[8192 28672]
-
blk.44.attn_k.weightQ4_K[8192 1024]
-
blk.44.attn_output.weightQ4_K[8192 8192]
-
blk.44.attn_q.weightQ4_K[8192 8192]
-
blk.44.attn_v.weightQ5_K[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ6_K[28672 8192]
-
blk.44.ffn_up.weightQ4_K[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ4_K[28672 8192]
-
blk.45.ffn_gate.weightQ4_K[8192 28672]
-
blk.45.ffn_up.weightQ4_K[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightQ4_K[8192 1024]
-
blk.45.attn_output.weightQ4_K[8192 8192]
-
blk.45.attn_q.weightQ4_K[8192 8192]
-
blk.45.attn_v.weightQ5_K[8192 1024]
-
blk.46.ffn_down.weightQ4_K[28672 8192]
-
blk.46.ffn_gate.weightQ4_K[8192 28672]
-
blk.46.ffn_up.weightQ4_K[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.attn_k.weightQ4_K[8192 1024]
-
blk.46.attn_output.weightQ4_K[8192 8192]
-
blk.46.attn_q.weightQ4_K[8192 8192]
-
blk.46.attn_v.weightQ5_K[8192 1024]
-
blk.47.attn_k.weightQ4_K[8192 1024]
-
blk.47.attn_output.weightQ4_K[8192 8192]
-
blk.47.attn_q.weightQ4_K[8192 8192]
-
blk.47.attn_v.weightQ6_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ4_K[28672 8192]
-
blk.47.ffn_gate.weightQ4_K[8192 28672]
-
blk.47.ffn_up.weightQ4_K[8192 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightQ6_K[28672 8192]
-
blk.48.ffn_gate.weightQ4_K[8192 28672]
-
blk.48.ffn_up.weightQ4_K[8192 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.weightQ4_K[8192 1024]
-
blk.48.attn_output.weightQ4_K[8192 8192]
-
blk.48.attn_q.weightQ4_K[8192 8192]
-
blk.48.attn_v.weightQ6_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightQ4_K[28672 8192]
-
blk.49.ffn_gate.weightQ4_K[8192 28672]
-
blk.49.ffn_up.weightQ4_K[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_k.weightQ4_K[8192 1024]
-
blk.49.attn_output.weightQ4_K[8192 8192]
-
blk.49.attn_q.weightQ4_K[8192 8192]
-
blk.49.attn_v.weightQ5_K[8192 1024]
-
blk.50.attn_k.weightQ4_K[8192 1024]
-
blk.50.attn_q.weightQ4_K[8192 8192]
-
blk.50.attn_v.weightQ5_K[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightQ6_K[28672 8192]
-
blk.50.ffn_gate.weightQ4_K[8192 28672]
-
blk.50.ffn_up.weightQ4_K[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_output.weightQ4_K[8192 8192]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightQ4_K[28672 8192]
-
blk.51.ffn_gate.weightQ4_K[8192 28672]
-
blk.51.ffn_up.weightQ4_K[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.weightQ4_K[8192 1024]
-
blk.51.attn_output.weightQ4_K[8192 8192]
-
blk.51.attn_q.weightQ4_K[8192 8192]
-
blk.51.attn_v.weightQ5_K[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightQ4_K[28672 8192]
-
blk.52.ffn_gate.weightQ4_K[8192 28672]
-
blk.52.ffn_up.weightQ4_K[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.weightQ4_K[8192 1024]
-
blk.52.attn_output.weightQ4_K[8192 8192]
-
blk.52.attn_q.weightQ4_K[8192 8192]
-
blk.52.attn_v.weightQ6_K[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightQ4_K[28672 8192]
-
blk.53.ffn_gate.weightQ4_K[8192 28672]
-
blk.53.ffn_up.weightQ4_K[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.weightQ4_K[8192 1024]
-
blk.53.attn_output.weightQ4_K[8192 8192]
-
blk.53.attn_q.weightQ4_K[8192 8192]
-
blk.53.attn_v.weightQ5_K[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightQ6_K[28672 8192]
-
blk.54.ffn_gate.weightQ4_K[8192 28672]
-
blk.54.ffn_up.weightQ4_K[8192 28672]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.attn_k.weightQ4_K[8192 1024]
-
blk.54.attn_output.weightQ4_K[8192 8192]
-
blk.54.attn_q.weightQ4_K[8192 8192]
-
blk.54.attn_v.weightQ6_K[8192 1024]
-
blk.55.ffn_gate.weightQ4_K[8192 28672]
-
blk.55.ffn_up.weightQ4_K[8192 28672]
-
blk.55.attn_k.weightQ4_K[8192 1024]
-
blk.55.attn_output.weightQ4_K[8192 8192]
-
blk.55.attn_q.weightQ4_K[8192 8192]
-
blk.55.attn_v.weightQ5_K[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightQ4_K[28672 8192]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightQ6_K[28672 8192]
-
blk.56.ffn_gate.weightQ4_K[8192 28672]
-
blk.56.ffn_up.weightQ4_K[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.weightQ4_K[8192 1024]
-
blk.56.attn_output.weightQ4_K[8192 8192]
-
blk.56.attn_q.weightQ4_K[8192 8192]
-
blk.56.attn_v.weightQ6_K[8192 1024]
-
blk.57.ffn_down.weightQ4_K[28672 8192]
-
blk.57.ffn_gate.weightQ4_K[8192 28672]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_up.weightQ4_K[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_k.weightQ4_K[8192 1024]
-
blk.57.attn_output.weightQ4_K[8192 8192]
-
blk.57.attn_q.weightQ4_K[8192 8192]
-
blk.57.attn_v.weightQ5_K[8192 1024]
-
blk.58.ffn_gate.weightQ4_K[8192 28672]
-
blk.58.attn_k.weightQ4_K[8192 1024]
-
blk.58.attn_output.weightQ4_K[8192 8192]
-
blk.58.attn_q.weightQ4_K[8192 8192]
-
blk.58.attn_v.weightQ5_K[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightQ4_K[28672 8192]
-
blk.58.ffn_up.weightQ4_K[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightQ4_K[28672 8192]
-
blk.59.ffn_gate.weightQ4_K[8192 28672]
-
blk.59.ffn_up.weightQ4_K[8192 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.weightQ4_K[8192 1024]
-
blk.59.attn_output.weightQ4_K[8192 8192]
-
blk.59.attn_q.weightQ4_K[8192 8192]
-
blk.59.attn_v.weightQ5_K[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightQ6_K[28672 8192]
-
blk.60.ffn_gate.weightQ4_K[8192 28672]
-
blk.60.ffn_up.weightQ4_K[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.weightQ4_K[8192 1024]
-
blk.60.attn_output.weightQ4_K[8192 8192]
-
blk.60.attn_q.weightQ4_K[8192 8192]
-
blk.60.attn_v.weightQ6_K[8192 1024]
-
blk.61.attn_k.weightQ4_K[8192 1024]
-
blk.61.attn_output.weightQ4_K[8192 8192]
-
blk.61.attn_q.weightQ4_K[8192 8192]
-
blk.61.attn_v.weightQ5_K[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightQ6_K[28672 8192]
-
blk.61.ffn_gate.weightQ4_K[8192 28672]
-
blk.61.ffn_up.weightQ4_K[8192 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.62.ffn_down.weightQ4_K[28672 8192]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_gate.weightQ4_K[8192 28672]
-
blk.62.ffn_up.weightQ4_K[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.weightQ4_K[8192 1024]
-
blk.62.attn_output.weightQ4_K[8192 8192]
-
blk.62.attn_q.weightQ4_K[8192 8192]
-
blk.62.attn_v.weightQ5_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightQ4_K[28672 8192]
-
blk.63.ffn_gate.weightQ4_K[8192 28672]
-
blk.63.ffn_up.weightQ4_K[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_k.weightQ4_K[8192 1024]
-
blk.63.attn_output.weightQ4_K[8192 8192]
-
blk.63.attn_q.weightQ4_K[8192 8192]
-
blk.63.attn_v.weightQ5_K[8192 1024]
-
blk.64.attn_k.weightQ4_K[8192 1024]
-
blk.64.attn_q.weightQ4_K[8192 8192]
-
blk.64.attn_v.weightQ6_K[8192 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightQ4_K[28672 8192]
-
blk.64.ffn_gate.weightQ4_K[8192 28672]
-
blk.64.ffn_up.weightQ4_K[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_output.weightQ4_K[8192 8192]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightQ4_K[28672 8192]
-
blk.65.ffn_gate.weightQ4_K[8192 28672]
-
blk.65.ffn_up.weightQ4_K[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.weightQ4_K[8192 1024]
-
blk.65.attn_output.weightQ4_K[8192 8192]
-
blk.65.attn_q.weightQ4_K[8192 8192]
-
blk.65.attn_v.weightQ5_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightQ6_K[28672 8192]
-
blk.66.ffn_gate.weightQ4_K[8192 28672]
-
blk.66.ffn_up.weightQ4_K[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.weightQ4_K[8192 1024]
-
blk.66.attn_output.weightQ4_K[8192 8192]
-
blk.66.attn_q.weightQ4_K[8192 8192]
-
blk.66.attn_v.weightQ6_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightQ4_K[28672 8192]
-
blk.67.ffn_gate.weightQ4_K[8192 28672]
-
blk.67.ffn_up.weightQ4_K[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.weightQ4_K[8192 1024]
-
blk.67.attn_output.weightQ4_K[8192 8192]
-
blk.67.attn_q.weightQ4_K[8192 8192]
-
blk.67.attn_v.weightQ5_K[8192 1024]
-
blk.68.ffn_down.weightQ4_K[28672 8192]
-
blk.68.ffn_gate.weightQ4_K[8192 28672]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_up.weightQ4_K[8192 28672]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.weightQ4_K[8192 1024]
-
blk.68.attn_output.weightQ4_K[8192 8192]
-
blk.68.attn_q.weightQ4_K[8192 8192]
-
blk.68.attn_v.weightQ6_K[8192 1024]
-
blk.69.ffn_gate.weightQ4_K[8192 28672]
-
blk.69.ffn_up.weightQ4_K[8192 28672]
-
blk.69.attn_k.weightQ4_K[8192 1024]
-
blk.69.attn_output.weightQ4_K[8192 8192]
-
blk.69.attn_q.weightQ4_K[8192 8192]
-
blk.69.attn_v.weightQ5_K[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightQ6_K[28672 8192]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightQ6_K[28672 8192]
-
blk.70.ffn_gate.weightQ4_K[8192 28672]
-
blk.70.ffn_up.weightQ4_K[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.weightQ4_K[8192 1024]
-
blk.70.attn_output.weightQ4_K[8192 8192]
-
blk.70.attn_q.weightQ4_K[8192 8192]
-
blk.70.attn_v.weightQ6_K[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightQ6_K[28672 8192]
-
blk.71.ffn_gate.weightQ4_K[8192 28672]
-
blk.71.ffn_up.weightQ4_K[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.attn_k.weightQ4_K[8192 1024]
-
blk.71.attn_output.weightQ4_K[8192 8192]
-
blk.71.attn_q.weightQ4_K[8192 8192]
-
blk.71.attn_v.weightQ6_K[8192 1024]
-
blk.72.ffn_gate.weightQ4_K[8192 28672]
-
blk.72.attn_k.weightQ4_K[8192 1024]
-
blk.72.attn_output.weightQ4_K[8192 8192]
-
blk.72.attn_q.weightQ4_K[8192 8192]
-
blk.72.attn_v.weightQ6_K[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightQ6_K[28672 8192]
-
blk.72.ffn_up.weightQ4_K[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.73.ffn_down.weightQ6_K[28672 8192]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_gate.weightQ4_K[8192 28672]
-
blk.73.ffn_up.weightQ4_K[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.weightQ4_K[8192 1024]
-
blk.73.attn_output.weightQ4_K[8192 8192]
-
blk.73.attn_q.weightQ4_K[8192 8192]
-
blk.73.attn_v.weightQ6_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightQ6_K[28672 8192]
-
blk.74.ffn_gate.weightQ4_K[8192 28672]
-
blk.74.ffn_up.weightQ4_K[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.attn_k.weightQ4_K[8192 1024]
-
blk.74.attn_output.weightQ4_K[8192 8192]
-
blk.74.attn_q.weightQ4_K[8192 8192]
-
blk.74.attn_v.weightQ6_K[8192 1024]
-
blk.75.attn_k.weightQ4_K[8192 1024]
-
blk.75.attn_output.weightQ4_K[8192 8192]
-
blk.75.attn_q.weightQ4_K[8192 8192]
-
blk.75.attn_v.weightQ6_K[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightQ6_K[28672 8192]
-
blk.75.ffn_gate.weightQ4_K[8192 28672]
-
blk.75.ffn_up.weightQ4_K[8192 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightQ6_K[28672 8192]
-
blk.76.ffn_gate.weightQ4_K[8192 28672]
-
blk.76.ffn_up.weightQ4_K[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.weightQ4_K[8192 1024]
-
blk.76.attn_output.weightQ4_K[8192 8192]
-
blk.76.attn_q.weightQ4_K[8192 8192]
-
blk.76.attn_v.weightQ6_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightQ6_K[28672 8192]
-
blk.77.ffn_gate.weightQ4_K[8192 28672]
-
blk.77.ffn_up.weightQ4_K[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_k.weightQ4_K[8192 1024]
-
blk.77.attn_output.weightQ4_K[8192 8192]
-
blk.77.attn_q.weightQ4_K[8192 8192]
-
blk.77.attn_v.weightQ6_K[8192 1024]
-
blk.78.ffn_down.weightQ6_K[28672 8192]
-
blk.78.attn_k.weightQ4_K[8192 1024]
-
blk.78.attn_q.weightQ4_K[8192 8192]
-
blk.78.attn_v.weightQ6_K[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_gate.weightQ4_K[8192 28672]
-
blk.78.ffn_up.weightQ4_K[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_output.weightQ4_K[8192 8192]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightQ6_K[28672 8192]
-
blk.79.ffn_gate.weightQ4_K[8192 28672]
-
blk.79.ffn_up.weightQ4_K[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.weightQ4_K[8192 1024]
-
blk.79.attn_output.weightQ4_K[8192 8192]
-
blk.79.attn_q.weightQ4_K[8192 8192]
-
blk.79.attn_v.weightQ6_K[8192 1024]
-
output.weightF16[8192 32000]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79