latest
18GB
Codestral model with an optimised system prompt and parameters specifically for coding.
22B
264 Pulls Updated 3 months ago
06d97ad0738b · 18GB
-
quantize.imatrix.chunks_count74
-
quantize.imatrix.datasetgroup_40.txt
-
quantize.imatrix.entries_count392
-
quantize.imatrix.file./imatrix.dat
-
general.architecturellama
-
general.file_typeQ6_K
-
llama.attention.head_count48
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count56
-
llama.context_length32768
-
llama.embedding_length6144
-
llama.feed_forward_length16384
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32768
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> [INST] [/INST] ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ6_K[6144 32768]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.ffn_down.weightQ6_K[16384 6144]
-
blk.0.ffn_gate.weightQ6_K[6144 16384]
-
blk.0.ffn_up.weightQ6_K[6144 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.attn_k.weightQ6_K[6144 1024]
-
blk.0.attn_output.weightQ6_K[6144 6144]
-
blk.0.attn_q.weightQ6_K[6144 6144]
-
blk.0.attn_v.weightQ6_K[6144 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.ffn_down.weightQ6_K[16384 6144]
-
blk.1.ffn_gate.weightQ6_K[6144 16384]
-
blk.1.ffn_up.weightQ6_K[6144 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.attn_k.weightQ6_K[6144 1024]
-
blk.1.attn_output.weightQ6_K[6144 6144]
-
blk.1.attn_q.weightQ6_K[6144 6144]
-
blk.1.attn_v.weightQ6_K[6144 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.ffn_down.weightQ6_K[16384 6144]
-
blk.2.ffn_gate.weightQ6_K[6144 16384]
-
blk.2.ffn_up.weightQ6_K[6144 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.attn_k.weightQ6_K[6144 1024]
-
blk.2.attn_output.weightQ6_K[6144 6144]
-
blk.2.attn_q.weightQ6_K[6144 6144]
-
blk.2.attn_v.weightQ6_K[6144 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.ffn_down.weightQ6_K[16384 6144]
-
blk.3.ffn_gate.weightQ6_K[6144 16384]
-
blk.3.ffn_up.weightQ6_K[6144 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.attn_k.weightQ6_K[6144 1024]
-
blk.3.attn_output.weightQ6_K[6144 6144]
-
blk.3.attn_q.weightQ6_K[6144 6144]
-
blk.3.attn_v.weightQ6_K[6144 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.ffn_down.weightQ6_K[16384 6144]
-
blk.4.ffn_gate.weightQ6_K[6144 16384]
-
blk.4.ffn_up.weightQ6_K[6144 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.attn_k.weightQ6_K[6144 1024]
-
blk.4.attn_output.weightQ6_K[6144 6144]
-
blk.4.attn_q.weightQ6_K[6144 6144]
-
blk.4.attn_v.weightQ6_K[6144 1024]
-
blk.5.ffn_gate.weightQ6_K[6144 16384]
-
blk.5.ffn_up.weightQ6_K[6144 16384]
-
blk.5.attn_k.weightQ6_K[6144 1024]
-
blk.5.attn_output.weightQ6_K[6144 6144]
-
blk.5.attn_q.weightQ6_K[6144 6144]
-
blk.5.attn_v.weightQ6_K[6144 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.ffn_down.weightQ6_K[16384 6144]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.ffn_down.weightQ6_K[16384 6144]
-
blk.6.ffn_gate.weightQ6_K[6144 16384]
-
blk.6.ffn_up.weightQ6_K[6144 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.attn_k.weightQ6_K[6144 1024]
-
blk.6.attn_output.weightQ6_K[6144 6144]
-
blk.6.attn_q.weightQ6_K[6144 6144]
-
blk.6.attn_v.weightQ6_K[6144 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.ffn_down.weightQ6_K[16384 6144]
-
blk.7.ffn_gate.weightQ6_K[6144 16384]
-
blk.7.ffn_up.weightQ6_K[6144 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.attn_k.weightQ6_K[6144 1024]
-
blk.7.attn_output.weightQ6_K[6144 6144]
-
blk.7.attn_q.weightQ6_K[6144 6144]
-
blk.7.attn_v.weightQ6_K[6144 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.ffn_down.weightQ6_K[16384 6144]
-
blk.8.ffn_gate.weightQ6_K[6144 16384]
-
blk.8.ffn_up.weightQ6_K[6144 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.attn_k.weightQ6_K[6144 1024]
-
blk.8.attn_output.weightQ6_K[6144 6144]
-
blk.8.attn_q.weightQ6_K[6144 6144]
-
blk.8.attn_v.weightQ6_K[6144 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.ffn_down.weightQ6_K[16384 6144]
-
blk.9.ffn_gate.weightQ6_K[6144 16384]
-
blk.9.ffn_up.weightQ6_K[6144 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.attn_k.weightQ6_K[6144 1024]
-
blk.9.attn_output.weightQ6_K[6144 6144]
-
blk.9.attn_q.weightQ6_K[6144 6144]
-
blk.9.attn_v.weightQ6_K[6144 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.ffn_down.weightQ6_K[16384 6144]
-
blk.10.ffn_gate.weightQ6_K[6144 16384]
-
blk.10.ffn_up.weightQ6_K[6144 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.attn_k.weightQ6_K[6144 1024]
-
blk.10.attn_output.weightQ6_K[6144 6144]
-
blk.10.attn_q.weightQ6_K[6144 6144]
-
blk.10.attn_v.weightQ6_K[6144 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.ffn_down.weightQ6_K[16384 6144]
-
blk.11.ffn_gate.weightQ6_K[6144 16384]
-
blk.11.ffn_up.weightQ6_K[6144 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.attn_k.weightQ6_K[6144 1024]
-
blk.11.attn_output.weightQ6_K[6144 6144]
-
blk.11.attn_q.weightQ6_K[6144 6144]
-
blk.11.attn_v.weightQ6_K[6144 1024]
-
blk.12.attn_k.weightQ6_K[6144 1024]
-
blk.12.attn_q.weightQ6_K[6144 6144]
-
blk.12.attn_v.weightQ6_K[6144 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.ffn_down.weightQ6_K[16384 6144]
-
blk.12.ffn_gate.weightQ6_K[6144 16384]
-
blk.12.ffn_up.weightQ6_K[6144 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.attn_output.weightQ6_K[6144 6144]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.ffn_down.weightQ6_K[16384 6144]
-
blk.13.ffn_gate.weightQ6_K[6144 16384]
-
blk.13.ffn_up.weightQ6_K[6144 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.attn_k.weightQ6_K[6144 1024]
-
blk.13.attn_output.weightQ6_K[6144 6144]
-
blk.13.attn_q.weightQ6_K[6144 6144]
-
blk.13.attn_v.weightQ6_K[6144 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.ffn_down.weightQ6_K[16384 6144]
-
blk.14.ffn_gate.weightQ6_K[6144 16384]
-
blk.14.ffn_up.weightQ6_K[6144 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.attn_k.weightQ6_K[6144 1024]
-
blk.14.attn_output.weightQ6_K[6144 6144]
-
blk.14.attn_q.weightQ6_K[6144 6144]
-
blk.14.attn_v.weightQ6_K[6144 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.ffn_down.weightQ6_K[16384 6144]
-
blk.15.ffn_gate.weightQ6_K[6144 16384]
-
blk.15.ffn_up.weightQ6_K[6144 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.attn_k.weightQ6_K[6144 1024]
-
blk.15.attn_output.weightQ6_K[6144 6144]
-
blk.15.attn_q.weightQ6_K[6144 6144]
-
blk.15.attn_v.weightQ6_K[6144 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.ffn_down.weightQ6_K[16384 6144]
-
blk.16.ffn_gate.weightQ6_K[6144 16384]
-
blk.16.ffn_up.weightQ6_K[6144 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.attn_k.weightQ6_K[6144 1024]
-
blk.16.attn_output.weightQ6_K[6144 6144]
-
blk.16.attn_q.weightQ6_K[6144 6144]
-
blk.16.attn_v.weightQ6_K[6144 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.ffn_down.weightQ6_K[16384 6144]
-
blk.17.ffn_gate.weightQ6_K[6144 16384]
-
blk.17.ffn_up.weightQ6_K[6144 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.attn_k.weightQ6_K[6144 1024]
-
blk.17.attn_output.weightQ6_K[6144 6144]
-
blk.17.attn_q.weightQ6_K[6144 6144]
-
blk.17.attn_v.weightQ6_K[6144 1024]
-
blk.18.ffn_gate.weightQ6_K[6144 16384]
-
blk.18.attn_k.weightQ6_K[6144 1024]
-
blk.18.attn_output.weightQ6_K[6144 6144]
-
blk.18.attn_q.weightQ6_K[6144 6144]
-
blk.18.attn_v.weightQ6_K[6144 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.ffn_down.weightQ6_K[16384 6144]
-
blk.18.ffn_up.weightQ6_K[6144 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.ffn_down.weightQ6_K[16384 6144]
-
blk.19.ffn_gate.weightQ6_K[6144 16384]
-
blk.19.ffn_up.weightQ6_K[6144 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.attn_k.weightQ6_K[6144 1024]
-
blk.19.attn_output.weightQ6_K[6144 6144]
-
blk.19.attn_q.weightQ6_K[6144 6144]
-
blk.19.attn_v.weightQ6_K[6144 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.ffn_down.weightQ6_K[16384 6144]
-
blk.20.ffn_gate.weightQ6_K[6144 16384]
-
blk.20.ffn_up.weightQ6_K[6144 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.attn_k.weightQ6_K[6144 1024]
-
blk.20.attn_output.weightQ6_K[6144 6144]
-
blk.20.attn_q.weightQ6_K[6144 6144]
-
blk.20.attn_v.weightQ6_K[6144 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.ffn_down.weightQ6_K[16384 6144]
-
blk.21.ffn_gate.weightQ6_K[6144 16384]
-
blk.21.ffn_up.weightQ6_K[6144 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.attn_k.weightQ6_K[6144 1024]
-
blk.21.attn_output.weightQ6_K[6144 6144]
-
blk.21.attn_q.weightQ6_K[6144 6144]
-
blk.21.attn_v.weightQ6_K[6144 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.ffn_down.weightQ6_K[16384 6144]
-
blk.22.ffn_gate.weightQ6_K[6144 16384]
-
blk.22.ffn_up.weightQ6_K[6144 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.attn_k.weightQ6_K[6144 1024]
-
blk.22.attn_output.weightQ6_K[6144 6144]
-
blk.22.attn_q.weightQ6_K[6144 6144]
-
blk.22.attn_v.weightQ6_K[6144 1024]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.ffn_down.weightQ6_K[16384 6144]
-
blk.23.ffn_gate.weightQ6_K[6144 16384]
-
blk.23.ffn_up.weightQ6_K[6144 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.attn_k.weightQ6_K[6144 1024]
-
blk.23.attn_output.weightQ6_K[6144 6144]
-
blk.23.attn_q.weightQ6_K[6144 6144]
-
blk.23.attn_v.weightQ6_K[6144 1024]
-
blk.24.ffn_gate.weightQ6_K[6144 16384]
-
blk.24.ffn_up.weightQ6_K[6144 16384]
-
blk.24.attn_k.weightQ6_K[6144 1024]
-
blk.24.attn_output.weightQ6_K[6144 6144]
-
blk.24.attn_q.weightQ6_K[6144 6144]
-
blk.24.attn_v.weightQ6_K[6144 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.ffn_down.weightQ6_K[16384 6144]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.ffn_down.weightQ6_K[16384 6144]
-
blk.25.ffn_gate.weightQ6_K[6144 16384]
-
blk.25.ffn_up.weightQ6_K[6144 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.attn_k.weightQ6_K[6144 1024]
-
blk.25.attn_output.weightQ6_K[6144 6144]
-
blk.25.attn_q.weightQ6_K[6144 6144]
-
blk.25.attn_v.weightQ6_K[6144 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.ffn_down.weightQ6_K[16384 6144]
-
blk.26.ffn_gate.weightQ6_K[6144 16384]
-
blk.26.ffn_up.weightQ6_K[6144 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.attn_k.weightQ6_K[6144 1024]
-
blk.26.attn_output.weightQ6_K[6144 6144]
-
blk.26.attn_q.weightQ6_K[6144 6144]
-
blk.26.attn_v.weightQ6_K[6144 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.ffn_down.weightQ6_K[16384 6144]
-
blk.27.ffn_gate.weightQ6_K[6144 16384]
-
blk.27.ffn_up.weightQ6_K[6144 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.attn_k.weightQ6_K[6144 1024]
-
blk.27.attn_output.weightQ6_K[6144 6144]
-
blk.27.attn_q.weightQ6_K[6144 6144]
-
blk.27.attn_v.weightQ6_K[6144 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.ffn_down.weightQ6_K[16384 6144]
-
blk.28.ffn_gate.weightQ6_K[6144 16384]
-
blk.28.ffn_up.weightQ6_K[6144 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.attn_k.weightQ6_K[6144 1024]
-
blk.28.attn_output.weightQ6_K[6144 6144]
-
blk.28.attn_q.weightQ6_K[6144 6144]
-
blk.28.attn_v.weightQ6_K[6144 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.ffn_down.weightQ6_K[16384 6144]
-
blk.29.ffn_gate.weightQ6_K[6144 16384]
-
blk.29.ffn_up.weightQ6_K[6144 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.attn_k.weightQ6_K[6144 1024]
-
blk.29.attn_output.weightQ6_K[6144 6144]
-
blk.29.attn_q.weightQ6_K[6144 6144]
-
blk.29.attn_v.weightQ6_K[6144 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.ffn_down.weightQ6_K[16384 6144]
-
blk.30.ffn_gate.weightQ6_K[6144 16384]
-
blk.30.ffn_up.weightQ6_K[6144 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.attn_k.weightQ6_K[6144 1024]
-
blk.30.attn_output.weightQ6_K[6144 6144]
-
blk.30.attn_q.weightQ6_K[6144 6144]
-
blk.30.attn_v.weightQ6_K[6144 1024]
-
blk.31.attn_k.weightQ6_K[6144 1024]
-
blk.31.attn_q.weightQ6_K[6144 6144]
-
blk.31.attn_v.weightQ6_K[6144 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.ffn_down.weightQ6_K[16384 6144]
-
blk.31.ffn_gate.weightQ6_K[6144 16384]
-
blk.31.ffn_up.weightQ6_K[6144 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.31.attn_output.weightQ6_K[6144 6144]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.ffn_down.weightQ6_K[16384 6144]
-
blk.32.ffn_gate.weightQ6_K[6144 16384]
-
blk.32.ffn_up.weightQ6_K[6144 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.attn_k.weightQ6_K[6144 1024]
-
blk.32.attn_output.weightQ6_K[6144 6144]
-
blk.32.attn_q.weightQ6_K[6144 6144]
-
blk.32.attn_v.weightQ6_K[6144 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.ffn_down.weightQ6_K[16384 6144]
-
blk.33.ffn_gate.weightQ6_K[6144 16384]
-
blk.33.ffn_up.weightQ6_K[6144 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.attn_k.weightQ6_K[6144 1024]
-
blk.33.attn_output.weightQ6_K[6144 6144]
-
blk.33.attn_q.weightQ6_K[6144 6144]
-
blk.33.attn_v.weightQ6_K[6144 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.ffn_down.weightQ6_K[16384 6144]
-
blk.34.ffn_gate.weightQ6_K[6144 16384]
-
blk.34.ffn_up.weightQ6_K[6144 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.attn_k.weightQ6_K[6144 1024]
-
blk.34.attn_output.weightQ6_K[6144 6144]
-
blk.34.attn_q.weightQ6_K[6144 6144]
-
blk.34.attn_v.weightQ6_K[6144 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.ffn_down.weightQ6_K[16384 6144]
-
blk.35.ffn_gate.weightQ6_K[6144 16384]
-
blk.35.ffn_up.weightQ6_K[6144 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.attn_k.weightQ6_K[6144 1024]
-
blk.35.attn_output.weightQ6_K[6144 6144]
-
blk.35.attn_q.weightQ6_K[6144 6144]
-
blk.35.attn_v.weightQ6_K[6144 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.ffn_down.weightQ6_K[16384 6144]
-
blk.36.ffn_gate.weightQ6_K[6144 16384]
-
blk.36.ffn_up.weightQ6_K[6144 16384]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.attn_k.weightQ6_K[6144 1024]
-
blk.36.attn_output.weightQ6_K[6144 6144]
-
blk.36.attn_q.weightQ6_K[6144 6144]
-
blk.36.attn_v.weightQ6_K[6144 1024]
-
blk.37.ffn_gate.weightQ6_K[6144 16384]
-
blk.37.attn_k.weightQ6_K[6144 1024]
-
blk.37.attn_output.weightQ6_K[6144 6144]
-
blk.37.attn_q.weightQ6_K[6144 6144]
-
blk.37.attn_v.weightQ6_K[6144 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.ffn_down.weightQ6_K[16384 6144]
-
blk.37.ffn_up.weightQ6_K[6144 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.ffn_down.weightQ6_K[16384 6144]
-
blk.38.ffn_gate.weightQ6_K[6144 16384]
-
blk.38.ffn_up.weightQ6_K[6144 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.attn_k.weightQ6_K[6144 1024]
-
blk.38.attn_output.weightQ6_K[6144 6144]
-
blk.38.attn_q.weightQ6_K[6144 6144]
-
blk.38.attn_v.weightQ6_K[6144 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.ffn_down.weightQ6_K[16384 6144]
-
blk.39.ffn_gate.weightQ6_K[6144 16384]
-
blk.39.ffn_up.weightQ6_K[6144 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.attn_k.weightQ6_K[6144 1024]
-
blk.39.attn_output.weightQ6_K[6144 6144]
-
blk.39.attn_q.weightQ6_K[6144 6144]
-
blk.39.attn_v.weightQ6_K[6144 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.ffn_down.weightQ6_K[16384 6144]
-
blk.40.ffn_gate.weightQ6_K[6144 16384]
-
blk.40.ffn_up.weightQ6_K[6144 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.40.attn_k.weightQ6_K[6144 1024]
-
blk.40.attn_output.weightQ6_K[6144 6144]
-
blk.40.attn_q.weightQ6_K[6144 6144]
-
blk.40.attn_v.weightQ6_K[6144 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.ffn_down.weightQ6_K[16384 6144]
-
blk.41.ffn_gate.weightQ6_K[6144 16384]
-
blk.41.ffn_up.weightQ6_K[6144 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.41.attn_k.weightQ6_K[6144 1024]
-
blk.41.attn_output.weightQ6_K[6144 6144]
-
blk.41.attn_q.weightQ6_K[6144 6144]
-
blk.41.attn_v.weightQ6_K[6144 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.ffn_down.weightQ6_K[16384 6144]
-
blk.42.ffn_gate.weightQ6_K[6144 16384]
-
blk.42.ffn_up.weightQ6_K[6144 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.42.attn_k.weightQ6_K[6144 1024]
-
blk.42.attn_output.weightQ6_K[6144 6144]
-
blk.42.attn_q.weightQ6_K[6144 6144]
-
blk.42.attn_v.weightQ6_K[6144 1024]
-
blk.43.ffn_gate.weightQ6_K[6144 16384]
-
blk.43.ffn_up.weightQ6_K[6144 16384]
-
blk.43.attn_k.weightQ6_K[6144 1024]
-
blk.43.attn_output.weightQ6_K[6144 6144]
-
blk.43.attn_q.weightQ6_K[6144 6144]
-
blk.43.attn_v.weightQ6_K[6144 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.ffn_down.weightQ6_K[16384 6144]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.ffn_down.weightQ6_K[16384 6144]
-
blk.44.ffn_gate.weightQ6_K[6144 16384]
-
blk.44.ffn_up.weightQ6_K[6144 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.44.attn_k.weightQ6_K[6144 1024]
-
blk.44.attn_output.weightQ6_K[6144 6144]
-
blk.44.attn_q.weightQ6_K[6144 6144]
-
blk.44.attn_v.weightQ6_K[6144 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.ffn_down.weightQ6_K[16384 6144]
-
blk.45.ffn_gate.weightQ6_K[6144 16384]
-
blk.45.ffn_up.weightQ6_K[6144 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.45.attn_k.weightQ6_K[6144 1024]
-
blk.45.attn_output.weightQ6_K[6144 6144]
-
blk.45.attn_q.weightQ6_K[6144 6144]
-
blk.45.attn_v.weightQ6_K[6144 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.ffn_down.weightQ6_K[16384 6144]
-
blk.46.ffn_gate.weightQ6_K[6144 16384]
-
blk.46.ffn_up.weightQ6_K[6144 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.46.attn_k.weightQ6_K[6144 1024]
-
blk.46.attn_output.weightQ6_K[6144 6144]
-
blk.46.attn_q.weightQ6_K[6144 6144]
-
blk.46.attn_v.weightQ6_K[6144 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.ffn_down.weightQ6_K[16384 6144]
-
blk.47.ffn_gate.weightQ6_K[6144 16384]
-
blk.47.ffn_up.weightQ6_K[6144 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.47.attn_k.weightQ6_K[6144 1024]
-
blk.47.attn_output.weightQ6_K[6144 6144]
-
blk.47.attn_q.weightQ6_K[6144 6144]
-
blk.47.attn_v.weightQ6_K[6144 1024]
-
blk.48.attn_norm.weightF32[6144]
-
blk.48.ffn_down.weightQ6_K[16384 6144]
-
blk.48.ffn_gate.weightQ6_K[6144 16384]
-
blk.48.ffn_up.weightQ6_K[6144 16384]
-
blk.48.ffn_norm.weightF32[6144]
-
blk.48.attn_k.weightQ6_K[6144 1024]
-
blk.48.attn_output.weightQ6_K[6144 6144]
-
blk.48.attn_q.weightQ6_K[6144 6144]
-
blk.48.attn_v.weightQ6_K[6144 1024]
-
blk.49.attn_norm.weightF32[6144]
-
blk.49.ffn_down.weightQ6_K[16384 6144]
-
blk.49.ffn_gate.weightQ6_K[6144 16384]
-
blk.49.ffn_up.weightQ6_K[6144 16384]
-
blk.49.ffn_norm.weightF32[6144]
-
blk.49.attn_k.weightQ6_K[6144 1024]
-
blk.49.attn_output.weightQ6_K[6144 6144]
-
blk.49.attn_q.weightQ6_K[6144 6144]
-
blk.49.attn_v.weightQ6_K[6144 1024]
-
blk.50.attn_k.weightQ6_K[6144 1024]
-
blk.50.attn_q.weightQ6_K[6144 6144]
-
blk.50.attn_v.weightQ6_K[6144 1024]
-
blk.50.attn_norm.weightF32[6144]
-
blk.50.ffn_down.weightQ6_K[16384 6144]
-
blk.50.ffn_gate.weightQ6_K[6144 16384]
-
blk.50.ffn_up.weightQ6_K[6144 16384]
-
blk.50.ffn_norm.weightF32[6144]
-
blk.50.attn_output.weightQ6_K[6144 6144]
-
blk.51.attn_norm.weightF32[6144]
-
blk.51.ffn_down.weightQ6_K[16384 6144]
-
blk.51.ffn_gate.weightQ6_K[6144 16384]
-
blk.51.ffn_up.weightQ6_K[6144 16384]
-
blk.51.ffn_norm.weightF32[6144]
-
blk.51.attn_k.weightQ6_K[6144 1024]
-
blk.51.attn_output.weightQ6_K[6144 6144]
-
blk.51.attn_q.weightQ6_K[6144 6144]
-
blk.51.attn_v.weightQ6_K[6144 1024]
-
blk.52.attn_norm.weightF32[6144]
-
blk.52.ffn_down.weightQ6_K[16384 6144]
-
blk.52.ffn_gate.weightQ6_K[6144 16384]
-
blk.52.ffn_up.weightQ6_K[6144 16384]
-
blk.52.ffn_norm.weightF32[6144]
-
blk.52.attn_k.weightQ6_K[6144 1024]
-
blk.52.attn_output.weightQ6_K[6144 6144]
-
blk.52.attn_q.weightQ6_K[6144 6144]
-
blk.52.attn_v.weightQ6_K[6144 1024]
-
blk.53.attn_norm.weightF32[6144]
-
blk.53.ffn_down.weightQ6_K[16384 6144]
-
blk.53.ffn_gate.weightQ6_K[6144 16384]
-
blk.53.ffn_up.weightQ6_K[6144 16384]
-
blk.53.ffn_norm.weightF32[6144]
-
blk.53.attn_k.weightQ6_K[6144 1024]
-
blk.53.attn_output.weightQ6_K[6144 6144]
-
blk.53.attn_q.weightQ6_K[6144 6144]
-
blk.53.attn_v.weightQ6_K[6144 1024]
-
blk.54.attn_norm.weightF32[6144]
-
blk.54.ffn_down.weightQ6_K[16384 6144]
-
blk.54.ffn_gate.weightQ6_K[6144 16384]
-
blk.54.ffn_up.weightQ6_K[6144 16384]
-
blk.54.ffn_norm.weightF32[6144]
-
blk.54.attn_k.weightQ6_K[6144 1024]
-
blk.54.attn_output.weightQ6_K[6144 6144]
-
blk.54.attn_q.weightQ6_K[6144 6144]
-
blk.54.attn_v.weightQ6_K[6144 1024]
-
blk.55.attn_norm.weightF32[6144]
-
blk.55.ffn_down.weightQ6_K[16384 6144]
-
blk.55.ffn_gate.weightQ6_K[6144 16384]
-
blk.55.ffn_up.weightQ6_K[6144 16384]
-
blk.55.ffn_norm.weightF32[6144]
-
blk.55.attn_k.weightQ6_K[6144 1024]
-
blk.55.attn_output.weightQ6_K[6144 6144]
-
blk.55.attn_q.weightQ6_K[6144 6144]
-
blk.55.attn_v.weightQ6_K[6144 1024]
-
output.weightQ6_K[6144 32768]
-
output_norm.weightF32[6144]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55