Trinity is a coding specific Large Language Model series created by Migel Tissera.
22B
5 Pulls Updated 3 days ago
5fb0375a00bd · 13GB
-
quantize.imatrix.chunks_count148
-
quantize.imatrix.dataset/training_dir/calibration_datav3.txt
-
quantize.imatrix.entries_count392
-
quantize.imatrix.file/models_out/Trinity-2-Codestral-22B-v0.2-GGUF/Trinity-2-Codestral-22B-v0.2.imatrix
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count48
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count56
-
llama.context_length32768
-
llama.embedding_length6144
-
llama.feed_forward_length16384
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32771
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id32768
-
tokenizer.ggml.eos_token_id32769
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32770
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 4 4 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> [INST] [/INST] ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[6144 32771]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.ffn_down.weightQ6_K[16384 6144]
-
blk.0.ffn_gate.weightQ4_K[6144 16384]
-
blk.0.ffn_up.weightQ4_K[6144 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.attn_k.weightQ4_K[6144 1024]
-
blk.0.attn_output.weightQ4_K[6144 6144]
-
blk.0.attn_q.weightQ4_K[6144 6144]
-
blk.0.attn_v.weightQ6_K[6144 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.ffn_down.weightQ6_K[16384 6144]
-
blk.1.ffn_gate.weightQ4_K[6144 16384]
-
blk.1.ffn_up.weightQ4_K[6144 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.attn_k.weightQ4_K[6144 1024]
-
blk.1.attn_output.weightQ4_K[6144 6144]
-
blk.1.attn_q.weightQ4_K[6144 6144]
-
blk.1.attn_v.weightQ6_K[6144 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.ffn_down.weightQ6_K[16384 6144]
-
blk.2.ffn_gate.weightQ4_K[6144 16384]
-
blk.2.ffn_up.weightQ4_K[6144 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.attn_k.weightQ4_K[6144 1024]
-
blk.2.attn_output.weightQ4_K[6144 6144]
-
blk.2.attn_q.weightQ4_K[6144 6144]
-
blk.2.attn_v.weightQ6_K[6144 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.ffn_down.weightQ6_K[16384 6144]
-
blk.3.ffn_gate.weightQ4_K[6144 16384]
-
blk.3.ffn_up.weightQ4_K[6144 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.attn_k.weightQ4_K[6144 1024]
-
blk.3.attn_output.weightQ4_K[6144 6144]
-
blk.3.attn_q.weightQ4_K[6144 6144]
-
blk.3.attn_v.weightQ6_K[6144 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.ffn_down.weightQ6_K[16384 6144]
-
blk.4.ffn_gate.weightQ4_K[6144 16384]
-
blk.4.ffn_up.weightQ4_K[6144 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.attn_k.weightQ4_K[6144 1024]
-
blk.4.attn_output.weightQ4_K[6144 6144]
-
blk.4.attn_q.weightQ4_K[6144 6144]
-
blk.4.attn_v.weightQ6_K[6144 1024]
-
blk.5.ffn_gate.weightQ4_K[6144 16384]
-
blk.5.ffn_up.weightQ4_K[6144 16384]
-
blk.5.attn_k.weightQ4_K[6144 1024]
-
blk.5.attn_output.weightQ4_K[6144 6144]
-
blk.5.attn_q.weightQ4_K[6144 6144]
-
blk.5.attn_v.weightQ6_K[6144 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.ffn_down.weightQ4_K[16384 6144]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.ffn_down.weightQ4_K[16384 6144]
-
blk.6.ffn_gate.weightQ4_K[6144 16384]
-
blk.6.ffn_up.weightQ4_K[6144 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.attn_k.weightQ4_K[6144 1024]
-
blk.6.attn_output.weightQ4_K[6144 6144]
-
blk.6.attn_q.weightQ4_K[6144 6144]
-
blk.6.attn_v.weightQ6_K[6144 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.ffn_down.weightQ6_K[16384 6144]
-
blk.7.ffn_gate.weightQ4_K[6144 16384]
-
blk.7.ffn_up.weightQ4_K[6144 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.attn_k.weightQ4_K[6144 1024]
-
blk.7.attn_output.weightQ4_K[6144 6144]
-
blk.7.attn_q.weightQ4_K[6144 6144]
-
blk.7.attn_v.weightQ4_K[6144 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.ffn_down.weightQ4_K[16384 6144]
-
blk.8.ffn_gate.weightQ4_K[6144 16384]
-
blk.8.ffn_up.weightQ4_K[6144 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.attn_k.weightQ4_K[6144 1024]
-
blk.8.attn_output.weightQ4_K[6144 6144]
-
blk.8.attn_q.weightQ4_K[6144 6144]
-
blk.8.attn_v.weightQ4_K[6144 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.ffn_down.weightQ4_K[16384 6144]
-
blk.9.ffn_gate.weightQ4_K[6144 16384]
-
blk.9.ffn_up.weightQ4_K[6144 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.attn_k.weightQ4_K[6144 1024]
-
blk.9.attn_output.weightQ4_K[6144 6144]
-
blk.9.attn_q.weightQ4_K[6144 6144]
-
blk.9.attn_v.weightQ6_K[6144 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.ffn_down.weightQ6_K[16384 6144]
-
blk.10.ffn_gate.weightQ4_K[6144 16384]
-
blk.10.ffn_up.weightQ4_K[6144 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.attn_k.weightQ4_K[6144 1024]
-
blk.10.attn_output.weightQ4_K[6144 6144]
-
blk.10.attn_q.weightQ4_K[6144 6144]
-
blk.10.attn_v.weightQ6_K[6144 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.ffn_down.weightQ6_K[16384 6144]
-
blk.11.ffn_gate.weightQ4_K[6144 16384]
-
blk.11.ffn_up.weightQ4_K[6144 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.attn_k.weightQ4_K[6144 1024]
-
blk.11.attn_output.weightQ4_K[6144 6144]
-
blk.11.attn_q.weightQ4_K[6144 6144]
-
blk.11.attn_v.weightQ4_K[6144 1024]
-
blk.12.attn_k.weightQ4_K[6144 1024]
-
blk.12.attn_q.weightQ4_K[6144 6144]
-
blk.12.attn_v.weightQ4_K[6144 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.ffn_down.weightQ6_K[16384 6144]
-
blk.12.ffn_gate.weightQ4_K[6144 16384]
-
blk.12.ffn_up.weightQ4_K[6144 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.attn_output.weightQ4_K[6144 6144]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.ffn_down.weightQ4_K[16384 6144]
-
blk.13.ffn_gate.weightQ4_K[6144 16384]
-
blk.13.ffn_up.weightQ4_K[6144 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.attn_k.weightQ4_K[6144 1024]
-
blk.13.attn_output.weightQ4_K[6144 6144]
-
blk.13.attn_q.weightQ4_K[6144 6144]
-
blk.13.attn_v.weightQ4_K[6144 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.ffn_down.weightQ4_K[16384 6144]
-
blk.14.ffn_gate.weightQ4_K[6144 16384]
-
blk.14.ffn_up.weightQ4_K[6144 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.attn_k.weightQ4_K[6144 1024]
-
blk.14.attn_output.weightQ4_K[6144 6144]
-
blk.14.attn_q.weightQ4_K[6144 6144]
-
blk.14.attn_v.weightQ4_K[6144 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.ffn_down.weightQ6_K[16384 6144]
-
blk.15.ffn_gate.weightQ4_K[6144 16384]
-
blk.15.ffn_up.weightQ4_K[6144 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.attn_k.weightQ4_K[6144 1024]
-
blk.15.attn_output.weightQ4_K[6144 6144]
-
blk.15.attn_q.weightQ4_K[6144 6144]
-
blk.15.attn_v.weightQ6_K[6144 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.ffn_down.weightQ4_K[16384 6144]
-
blk.16.ffn_gate.weightQ4_K[6144 16384]
-
blk.16.ffn_up.weightQ4_K[6144 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.attn_k.weightQ4_K[6144 1024]
-
blk.16.attn_output.weightQ4_K[6144 6144]
-
blk.16.attn_q.weightQ4_K[6144 6144]
-
blk.16.attn_v.weightQ4_K[6144 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.ffn_down.weightQ4_K[16384 6144]
-
blk.17.ffn_gate.weightQ4_K[6144 16384]
-
blk.17.ffn_up.weightQ4_K[6144 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.attn_k.weightQ4_K[6144 1024]
-
blk.17.attn_output.weightQ4_K[6144 6144]
-
blk.17.attn_q.weightQ4_K[6144 6144]
-
blk.17.attn_v.weightQ4_K[6144 1024]
-
blk.18.ffn_gate.weightQ4_K[6144 16384]
-
blk.18.attn_k.weightQ4_K[6144 1024]
-
blk.18.attn_output.weightQ4_K[6144 6144]
-
blk.18.attn_q.weightQ4_K[6144 6144]
-
blk.18.attn_v.weightQ6_K[6144 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.ffn_down.weightQ6_K[16384 6144]
-
blk.18.ffn_up.weightQ4_K[6144 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.ffn_down.weightQ4_K[16384 6144]
-
blk.19.ffn_gate.weightQ4_K[6144 16384]
-
blk.19.ffn_up.weightQ4_K[6144 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.attn_k.weightQ4_K[6144 1024]
-
blk.19.attn_output.weightQ4_K[6144 6144]
-
blk.19.attn_q.weightQ4_K[6144 6144]
-
blk.19.attn_v.weightQ4_K[6144 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.ffn_down.weightQ4_K[16384 6144]
-
blk.20.ffn_gate.weightQ4_K[6144 16384]
-
blk.20.ffn_up.weightQ4_K[6144 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.attn_k.weightQ4_K[6144 1024]
-
blk.20.attn_output.weightQ4_K[6144 6144]
-
blk.20.attn_q.weightQ4_K[6144 6144]
-
blk.20.attn_v.weightQ4_K[6144 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.ffn_down.weightQ6_K[16384 6144]
-
blk.21.ffn_gate.weightQ4_K[6144 16384]
-
blk.21.ffn_up.weightQ4_K[6144 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.attn_k.weightQ4_K[6144 1024]
-
blk.21.attn_output.weightQ4_K[6144 6144]
-
blk.21.attn_q.weightQ4_K[6144 6144]
-
blk.21.attn_v.weightQ6_K[6144 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.ffn_down.weightQ4_K[16384 6144]
-
blk.22.ffn_gate.weightQ4_K[6144 16384]
-
blk.22.ffn_up.weightQ4_K[6144 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.attn_k.weightQ4_K[6144 1024]
-
blk.22.attn_output.weightQ4_K[6144 6144]
-
blk.22.attn_q.weightQ4_K[6144 6144]
-
blk.22.attn_v.weightQ4_K[6144 1024]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.ffn_down.weightQ4_K[16384 6144]
-
blk.23.ffn_gate.weightQ4_K[6144 16384]
-
blk.23.ffn_up.weightQ4_K[6144 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.attn_k.weightQ4_K[6144 1024]
-
blk.23.attn_output.weightQ4_K[6144 6144]
-
blk.23.attn_q.weightQ4_K[6144 6144]
-
blk.23.attn_v.weightQ4_K[6144 1024]
-
blk.24.ffn_gate.weightQ4_K[6144 16384]
-
blk.24.ffn_up.weightQ4_K[6144 16384]
-
blk.24.attn_k.weightQ4_K[6144 1024]
-
blk.24.attn_output.weightQ4_K[6144 6144]
-
blk.24.attn_q.weightQ4_K[6144 6144]
-
blk.24.attn_v.weightQ6_K[6144 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.ffn_down.weightQ6_K[16384 6144]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.ffn_down.weightQ4_K[16384 6144]
-
blk.25.ffn_gate.weightQ4_K[6144 16384]
-
blk.25.ffn_up.weightQ4_K[6144 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.attn_k.weightQ4_K[6144 1024]
-
blk.25.attn_output.weightQ4_K[6144 6144]
-
blk.25.attn_q.weightQ4_K[6144 6144]
-
blk.25.attn_v.weightQ4_K[6144 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.ffn_down.weightQ4_K[16384 6144]
-
blk.26.ffn_gate.weightQ4_K[6144 16384]
-
blk.26.ffn_up.weightQ4_K[6144 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.attn_k.weightQ4_K[6144 1024]
-
blk.26.attn_output.weightQ4_K[6144 6144]
-
blk.26.attn_q.weightQ4_K[6144 6144]
-
blk.26.attn_v.weightQ4_K[6144 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.ffn_down.weightQ6_K[16384 6144]
-
blk.27.ffn_gate.weightQ4_K[6144 16384]
-
blk.27.ffn_up.weightQ4_K[6144 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.attn_k.weightQ4_K[6144 1024]
-
blk.27.attn_output.weightQ4_K[6144 6144]
-
blk.27.attn_q.weightQ4_K[6144 6144]
-
blk.27.attn_v.weightQ6_K[6144 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.ffn_down.weightQ4_K[16384 6144]
-
blk.28.ffn_gate.weightQ4_K[6144 16384]
-
blk.28.ffn_up.weightQ4_K[6144 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.attn_k.weightQ4_K[6144 1024]
-
blk.28.attn_output.weightQ4_K[6144 6144]
-
blk.28.attn_q.weightQ4_K[6144 6144]
-
blk.28.attn_v.weightQ4_K[6144 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.ffn_down.weightQ4_K[16384 6144]
-
blk.29.ffn_gate.weightQ4_K[6144 16384]
-
blk.29.ffn_up.weightQ4_K[6144 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.attn_k.weightQ4_K[6144 1024]
-
blk.29.attn_output.weightQ4_K[6144 6144]
-
blk.29.attn_q.weightQ4_K[6144 6144]
-
blk.29.attn_v.weightQ4_K[6144 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.ffn_down.weightQ6_K[16384 6144]
-
blk.30.ffn_gate.weightQ4_K[6144 16384]
-
blk.30.ffn_up.weightQ4_K[6144 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.attn_k.weightQ4_K[6144 1024]
-
blk.30.attn_output.weightQ4_K[6144 6144]
-
blk.30.attn_q.weightQ4_K[6144 6144]
-
blk.30.attn_v.weightQ6_K[6144 1024]
-
blk.31.attn_k.weightQ4_K[6144 1024]
-
blk.31.attn_q.weightQ4_K[6144 6144]
-
blk.31.attn_v.weightQ4_K[6144 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.ffn_down.weightQ4_K[16384 6144]
-
blk.31.ffn_gate.weightQ4_K[6144 16384]
-
blk.31.ffn_up.weightQ4_K[6144 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.31.attn_output.weightQ4_K[6144 6144]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.ffn_down.weightQ4_K[16384 6144]
-
blk.32.ffn_gate.weightQ4_K[6144 16384]
-
blk.32.ffn_up.weightQ4_K[6144 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.attn_k.weightQ4_K[6144 1024]
-
blk.32.attn_output.weightQ4_K[6144 6144]
-
blk.32.attn_q.weightQ4_K[6144 6144]
-
blk.32.attn_v.weightQ4_K[6144 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.ffn_down.weightQ6_K[16384 6144]
-
blk.33.ffn_gate.weightQ4_K[6144 16384]
-
blk.33.ffn_up.weightQ4_K[6144 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.attn_k.weightQ4_K[6144 1024]
-
blk.33.attn_output.weightQ4_K[6144 6144]
-
blk.33.attn_q.weightQ4_K[6144 6144]
-
blk.33.attn_v.weightQ6_K[6144 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.ffn_down.weightQ4_K[16384 6144]
-
blk.34.ffn_gate.weightQ4_K[6144 16384]
-
blk.34.ffn_up.weightQ4_K[6144 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.attn_k.weightQ4_K[6144 1024]
-
blk.34.attn_output.weightQ4_K[6144 6144]
-
blk.34.attn_q.weightQ4_K[6144 6144]
-
blk.34.attn_v.weightQ4_K[6144 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.ffn_down.weightQ4_K[16384 6144]
-
blk.35.ffn_gate.weightQ4_K[6144 16384]
-
blk.35.ffn_up.weightQ4_K[6144 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.attn_k.weightQ4_K[6144 1024]
-
blk.35.attn_output.weightQ4_K[6144 6144]
-
blk.35.attn_q.weightQ4_K[6144 6144]
-
blk.35.attn_v.weightQ4_K[6144 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.ffn_down.weightQ6_K[16384 6144]
-
blk.36.ffn_gate.weightQ4_K[6144 16384]
-
blk.36.ffn_up.weightQ4_K[6144 16384]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.attn_k.weightQ4_K[6144 1024]
-
blk.36.attn_output.weightQ4_K[6144 6144]
-
blk.36.attn_q.weightQ4_K[6144 6144]
-
blk.36.attn_v.weightQ6_K[6144 1024]
-
blk.37.ffn_gate.weightQ4_K[6144 16384]
-
blk.37.attn_k.weightQ4_K[6144 1024]
-
blk.37.attn_output.weightQ4_K[6144 6144]
-
blk.37.attn_q.weightQ4_K[6144 6144]
-
blk.37.attn_v.weightQ4_K[6144 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.ffn_down.weightQ4_K[16384 6144]
-
blk.37.ffn_up.weightQ4_K[6144 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.ffn_down.weightQ4_K[16384 6144]
-
blk.38.ffn_gate.weightQ4_K[6144 16384]
-
blk.38.ffn_up.weightQ4_K[6144 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.attn_k.weightQ4_K[6144 1024]
-
blk.38.attn_output.weightQ4_K[6144 6144]
-
blk.38.attn_q.weightQ4_K[6144 6144]
-
blk.38.attn_v.weightQ4_K[6144 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.ffn_down.weightQ6_K[16384 6144]
-
blk.39.ffn_gate.weightQ4_K[6144 16384]
-
blk.39.ffn_up.weightQ4_K[6144 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.attn_k.weightQ4_K[6144 1024]
-
blk.39.attn_output.weightQ4_K[6144 6144]
-
blk.39.attn_q.weightQ4_K[6144 6144]
-
blk.39.attn_v.weightQ6_K[6144 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.ffn_down.weightQ4_K[16384 6144]
-
blk.40.ffn_gate.weightQ4_K[6144 16384]
-
blk.40.ffn_up.weightQ4_K[6144 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.40.attn_k.weightQ4_K[6144 1024]
-
blk.40.attn_output.weightQ4_K[6144 6144]
-
blk.40.attn_q.weightQ4_K[6144 6144]
-
blk.40.attn_v.weightQ4_K[6144 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.ffn_down.weightQ4_K[16384 6144]
-
blk.41.ffn_gate.weightQ4_K[6144 16384]
-
blk.41.ffn_up.weightQ4_K[6144 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.41.attn_k.weightQ4_K[6144 1024]
-
blk.41.attn_output.weightQ4_K[6144 6144]
-
blk.41.attn_q.weightQ4_K[6144 6144]
-
blk.41.attn_v.weightQ4_K[6144 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.ffn_down.weightQ6_K[16384 6144]
-
blk.42.ffn_gate.weightQ4_K[6144 16384]
-
blk.42.ffn_up.weightQ4_K[6144 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.42.attn_k.weightQ4_K[6144 1024]
-
blk.42.attn_output.weightQ4_K[6144 6144]
-
blk.42.attn_q.weightQ4_K[6144 6144]
-
blk.42.attn_v.weightQ6_K[6144 1024]
-
blk.43.ffn_gate.weightQ4_K[6144 16384]
-
blk.43.ffn_up.weightQ4_K[6144 16384]
-
blk.43.attn_k.weightQ4_K[6144 1024]
-
blk.43.attn_output.weightQ4_K[6144 6144]
-
blk.43.attn_q.weightQ4_K[6144 6144]
-
blk.43.attn_v.weightQ4_K[6144 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.ffn_down.weightQ4_K[16384 6144]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.ffn_down.weightQ4_K[16384 6144]
-
blk.44.ffn_gate.weightQ4_K[6144 16384]
-
blk.44.ffn_up.weightQ4_K[6144 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.44.attn_k.weightQ4_K[6144 1024]
-
blk.44.attn_output.weightQ4_K[6144 6144]
-
blk.44.attn_q.weightQ4_K[6144 6144]
-
blk.44.attn_v.weightQ4_K[6144 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.ffn_down.weightQ6_K[16384 6144]
-
blk.45.ffn_gate.weightQ4_K[6144 16384]
-
blk.45.ffn_up.weightQ4_K[6144 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.45.attn_k.weightQ4_K[6144 1024]
-
blk.45.attn_output.weightQ4_K[6144 6144]
-
blk.45.attn_q.weightQ4_K[6144 6144]
-
blk.45.attn_v.weightQ6_K[6144 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.ffn_down.weightQ4_K[16384 6144]
-
blk.46.ffn_gate.weightQ4_K[6144 16384]
-
blk.46.ffn_up.weightQ4_K[6144 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.46.attn_k.weightQ4_K[6144 1024]
-
blk.46.attn_output.weightQ4_K[6144 6144]
-
blk.46.attn_q.weightQ4_K[6144 6144]
-
blk.46.attn_v.weightQ4_K[6144 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.ffn_down.weightQ4_K[16384 6144]
-
blk.47.ffn_gate.weightQ4_K[6144 16384]
-
blk.47.ffn_up.weightQ4_K[6144 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.47.attn_k.weightQ4_K[6144 1024]
-
blk.47.attn_output.weightQ4_K[6144 6144]
-
blk.47.attn_q.weightQ4_K[6144 6144]
-
blk.47.attn_v.weightQ4_K[6144 1024]
-
blk.48.attn_norm.weightF32[6144]
-
blk.48.ffn_down.weightQ6_K[16384 6144]
-
blk.48.ffn_gate.weightQ4_K[6144 16384]
-
blk.48.ffn_up.weightQ4_K[6144 16384]
-
blk.48.ffn_norm.weightF32[6144]
-
blk.48.attn_k.weightQ4_K[6144 1024]
-
blk.48.attn_output.weightQ4_K[6144 6144]
-
blk.48.attn_q.weightQ4_K[6144 6144]
-
blk.48.attn_v.weightQ6_K[6144 1024]
-
blk.49.attn_norm.weightF32[6144]
-
blk.49.ffn_down.weightQ6_K[16384 6144]
-
blk.49.ffn_gate.weightQ4_K[6144 16384]
-
blk.49.ffn_up.weightQ4_K[6144 16384]
-
blk.49.ffn_norm.weightF32[6144]
-
blk.49.attn_k.weightQ4_K[6144 1024]
-
blk.49.attn_output.weightQ4_K[6144 6144]
-
blk.49.attn_q.weightQ4_K[6144 6144]
-
blk.49.attn_v.weightQ6_K[6144 1024]
-
blk.50.attn_k.weightQ4_K[6144 1024]
-
blk.50.attn_q.weightQ4_K[6144 6144]
-
blk.50.attn_v.weightQ6_K[6144 1024]
-
blk.50.attn_norm.weightF32[6144]
-
blk.50.ffn_down.weightQ6_K[16384 6144]
-
blk.50.ffn_gate.weightQ4_K[6144 16384]
-
blk.50.ffn_up.weightQ4_K[6144 16384]
-
blk.50.ffn_norm.weightF32[6144]
-
blk.50.attn_output.weightQ4_K[6144 6144]
-
blk.51.attn_norm.weightF32[6144]
-
blk.51.ffn_down.weightQ6_K[16384 6144]
-
blk.51.ffn_gate.weightQ4_K[6144 16384]
-
blk.51.ffn_up.weightQ4_K[6144 16384]
-
blk.51.ffn_norm.weightF32[6144]
-
blk.51.attn_k.weightQ4_K[6144 1024]
-
blk.51.attn_output.weightQ4_K[6144 6144]
-
blk.51.attn_q.weightQ4_K[6144 6144]
-
blk.51.attn_v.weightQ6_K[6144 1024]
-
blk.52.attn_norm.weightF32[6144]
-
blk.52.ffn_down.weightQ6_K[16384 6144]
-
blk.52.ffn_gate.weightQ4_K[6144 16384]
-
blk.52.ffn_up.weightQ4_K[6144 16384]
-
blk.52.ffn_norm.weightF32[6144]
-
blk.52.attn_k.weightQ4_K[6144 1024]
-
blk.52.attn_output.weightQ4_K[6144 6144]
-
blk.52.attn_q.weightQ4_K[6144 6144]
-
blk.52.attn_v.weightQ6_K[6144 1024]
-
blk.53.attn_norm.weightF32[6144]
-
blk.53.ffn_down.weightQ6_K[16384 6144]
-
blk.53.ffn_gate.weightQ4_K[6144 16384]
-
blk.53.ffn_up.weightQ4_K[6144 16384]
-
blk.53.ffn_norm.weightF32[6144]
-
blk.53.attn_k.weightQ4_K[6144 1024]
-
blk.53.attn_output.weightQ4_K[6144 6144]
-
blk.53.attn_q.weightQ4_K[6144 6144]
-
blk.53.attn_v.weightQ6_K[6144 1024]
-
blk.54.attn_norm.weightF32[6144]
-
blk.54.ffn_down.weightQ6_K[16384 6144]
-
blk.54.ffn_gate.weightQ4_K[6144 16384]
-
blk.54.ffn_up.weightQ4_K[6144 16384]
-
blk.54.ffn_norm.weightF32[6144]
-
blk.54.attn_k.weightQ4_K[6144 1024]
-
blk.54.attn_output.weightQ4_K[6144 6144]
-
blk.54.attn_q.weightQ4_K[6144 6144]
-
blk.54.attn_v.weightQ6_K[6144 1024]
-
blk.55.attn_norm.weightF32[6144]
-
blk.55.ffn_down.weightQ6_K[16384 6144]
-
blk.55.ffn_gate.weightQ4_K[6144 16384]
-
blk.55.ffn_up.weightQ4_K[6144 16384]
-
blk.55.ffn_norm.weightF32[6144]
-
blk.55.attn_k.weightQ4_K[6144 1024]
-
blk.55.attn_output.weightQ4_K[6144 6144]
-
blk.55.attn_q.weightQ4_K[6144 6144]
-
blk.55.attn_v.weightQ6_K[6144 1024]
-
output.weightQ6_K[6144 32771]
-
output_norm.weightF32[6144]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55