Codelama with 16k context unlocked in modelfile
13B
34B
173 Pulls Updated 10 months ago
ff10def5e6be · 16GB
-
general.architecturellama
-
general.file_typeQ3_K_M
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count48
-
llama.context_length16384
-
llama.embedding_length8192
-
llama.feed_forward_length22016
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ3_K[8192 32000]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ5_K[22016 8192]
-
blk.0.ffn_gate.weightQ3_K[8192 22016]
-
blk.0.ffn_up.weightQ3_K[8192 22016]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ3_K[8192 1024]
-
blk.0.attn_output.weightQ4_K[8192 8192]
-
blk.0.attn_q.weightQ3_K[8192 8192]
-
blk.0.attn_v.weightQ5_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ5_K[22016 8192]
-
blk.1.ffn_gate.weightQ3_K[8192 22016]
-
blk.1.ffn_up.weightQ3_K[8192 22016]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.weightQ3_K[8192 1024]
-
blk.1.attn_output.weightQ4_K[8192 8192]
-
blk.1.attn_q.weightQ3_K[8192 8192]
-
blk.1.attn_v.weightQ5_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ4_K[22016 8192]
-
blk.2.ffn_gate.weightQ3_K[8192 22016]
-
blk.2.ffn_up.weightQ3_K[8192 22016]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightQ3_K[8192 1024]
-
blk.2.attn_output.weightQ4_K[8192 8192]
-
blk.2.attn_q.weightQ3_K[8192 8192]
-
blk.2.attn_v.weightQ4_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ4_K[22016 8192]
-
blk.3.ffn_gate.weightQ3_K[8192 22016]
-
blk.3.ffn_up.weightQ3_K[8192 22016]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightQ3_K[8192 1024]
-
blk.3.attn_output.weightQ4_K[8192 8192]
-
blk.3.attn_q.weightQ3_K[8192 8192]
-
blk.3.attn_v.weightQ4_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ4_K[22016 8192]
-
blk.4.ffn_gate.weightQ3_K[8192 22016]
-
blk.4.ffn_up.weightQ3_K[8192 22016]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.weightQ3_K[8192 1024]
-
blk.4.attn_output.weightQ4_K[8192 8192]
-
blk.4.attn_q.weightQ3_K[8192 8192]
-
blk.4.attn_v.weightQ4_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ4_K[22016 8192]
-
blk.5.ffn_gate.weightQ3_K[8192 22016]
-
blk.5.ffn_up.weightQ3_K[8192 22016]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.weightQ3_K[8192 1024]
-
blk.5.attn_output.weightQ4_K[8192 8192]
-
blk.5.attn_q.weightQ3_K[8192 8192]
-
blk.5.attn_v.weightQ4_K[8192 1024]
-
blk.6.ffn_gate.weightQ3_K[8192 22016]
-
blk.6.ffn_up.weightQ3_K[8192 22016]
-
blk.6.attn_k.weightQ3_K[8192 1024]
-
blk.6.attn_output.weightQ4_K[8192 8192]
-
blk.6.attn_q.weightQ3_K[8192 8192]
-
blk.6.attn_v.weightQ4_K[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_K[22016 8192]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_K[22016 8192]
-
blk.7.ffn_gate.weightQ3_K[8192 22016]
-
blk.7.ffn_up.weightQ3_K[8192 22016]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.weightQ3_K[8192 1024]
-
blk.7.attn_output.weightQ4_K[8192 8192]
-
blk.7.attn_q.weightQ3_K[8192 8192]
-
blk.7.attn_v.weightQ4_K[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ4_K[22016 8192]
-
blk.8.ffn_gate.weightQ3_K[8192 22016]
-
blk.8.ffn_up.weightQ3_K[8192 22016]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.weightQ3_K[8192 1024]
-
blk.8.attn_output.weightQ4_K[8192 8192]
-
blk.8.attn_q.weightQ3_K[8192 8192]
-
blk.8.attn_v.weightQ4_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_K[22016 8192]
-
blk.9.ffn_gate.weightQ3_K[8192 22016]
-
blk.9.ffn_up.weightQ3_K[8192 22016]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ3_K[8192 1024]
-
blk.9.attn_output.weightQ4_K[8192 8192]
-
blk.9.attn_q.weightQ3_K[8192 8192]
-
blk.9.attn_v.weightQ4_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_K[22016 8192]
-
blk.10.ffn_gate.weightQ3_K[8192 22016]
-
blk.10.ffn_up.weightQ3_K[8192 22016]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightQ3_K[8192 1024]
-
blk.10.attn_output.weightQ4_K[8192 8192]
-
blk.10.attn_q.weightQ3_K[8192 8192]
-
blk.10.attn_v.weightQ4_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_K[22016 8192]
-
blk.11.ffn_gate.weightQ3_K[8192 22016]
-
blk.11.ffn_up.weightQ3_K[8192 22016]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightQ3_K[8192 1024]
-
blk.11.attn_output.weightQ4_K[8192 8192]
-
blk.11.attn_q.weightQ3_K[8192 8192]
-
blk.11.attn_v.weightQ4_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_K[22016 8192]
-
blk.12.ffn_gate.weightQ3_K[8192 22016]
-
blk.12.ffn_up.weightQ3_K[8192 22016]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.weightQ3_K[8192 1024]
-
blk.12.attn_output.weightQ4_K[8192 8192]
-
blk.12.attn_q.weightQ3_K[8192 8192]
-
blk.12.attn_v.weightQ4_K[8192 1024]
-
blk.13.ffn_gate.weightQ3_K[8192 22016]
-
blk.13.ffn_up.weightQ3_K[8192 22016]
-
blk.13.attn_k.weightQ3_K[8192 1024]
-
blk.13.attn_output.weightQ4_K[8192 8192]
-
blk.13.attn_q.weightQ3_K[8192 8192]
-
blk.13.attn_v.weightQ4_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_K[22016 8192]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_K[22016 8192]
-
blk.14.ffn_gate.weightQ3_K[8192 22016]
-
blk.14.ffn_up.weightQ3_K[8192 22016]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ3_K[8192 1024]
-
blk.14.attn_output.weightQ4_K[8192 8192]
-
blk.14.attn_q.weightQ3_K[8192 8192]
-
blk.14.attn_v.weightQ4_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_K[22016 8192]
-
blk.15.ffn_gate.weightQ3_K[8192 22016]
-
blk.15.ffn_up.weightQ3_K[8192 22016]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.weightQ3_K[8192 1024]
-
blk.15.attn_output.weightQ4_K[8192 8192]
-
blk.15.attn_q.weightQ3_K[8192 8192]
-
blk.15.attn_v.weightQ4_K[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_K[22016 8192]
-
blk.16.ffn_gate.weightQ3_K[8192 22016]
-
blk.16.ffn_up.weightQ3_K[8192 22016]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.weightQ3_K[8192 1024]
-
blk.16.attn_output.weightQ4_K[8192 8192]
-
blk.16.attn_q.weightQ3_K[8192 8192]
-
blk.16.attn_v.weightQ4_K[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_K[22016 8192]
-
blk.17.ffn_gate.weightQ3_K[8192 22016]
-
blk.17.ffn_up.weightQ3_K[8192 22016]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightQ3_K[8192 1024]
-
blk.17.attn_output.weightQ4_K[8192 8192]
-
blk.17.attn_q.weightQ3_K[8192 8192]
-
blk.17.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_K[22016 8192]
-
blk.18.ffn_gate.weightQ3_K[8192 22016]
-
blk.18.ffn_up.weightQ3_K[8192 22016]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.weightQ3_K[8192 1024]
-
blk.18.attn_output.weightQ4_K[8192 8192]
-
blk.18.attn_q.weightQ3_K[8192 8192]
-
blk.18.attn_v.weightQ4_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_K[22016 8192]
-
blk.19.ffn_gate.weightQ3_K[8192 22016]
-
blk.19.ffn_up.weightQ3_K[8192 22016]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.weightQ3_K[8192 1024]
-
blk.19.attn_output.weightQ4_K[8192 8192]
-
blk.19.attn_q.weightQ3_K[8192 8192]
-
blk.19.attn_v.weightQ4_K[8192 1024]
-
blk.20.ffn_gate.weightQ3_K[8192 22016]
-
blk.20.ffn_up.weightQ3_K[8192 22016]
-
blk.20.attn_k.weightQ3_K[8192 1024]
-
blk.20.attn_output.weightQ4_K[8192 8192]
-
blk.20.attn_q.weightQ3_K[8192 8192]
-
blk.20.attn_v.weightQ4_K[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_K[22016 8192]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_K[22016 8192]
-
blk.21.ffn_gate.weightQ3_K[8192 22016]
-
blk.21.ffn_up.weightQ3_K[8192 22016]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.weightQ3_K[8192 1024]
-
blk.21.attn_output.weightQ4_K[8192 8192]
-
blk.21.attn_q.weightQ3_K[8192 8192]
-
blk.21.attn_v.weightQ4_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_K[22016 8192]
-
blk.22.ffn_gate.weightQ3_K[8192 22016]
-
blk.22.ffn_up.weightQ3_K[8192 22016]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.weightQ3_K[8192 1024]
-
blk.22.attn_output.weightQ4_K[8192 8192]
-
blk.22.attn_q.weightQ3_K[8192 8192]
-
blk.22.attn_v.weightQ4_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_K[22016 8192]
-
blk.23.ffn_gate.weightQ3_K[8192 22016]
-
blk.23.ffn_up.weightQ3_K[8192 22016]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ3_K[8192 1024]
-
blk.23.attn_output.weightQ4_K[8192 8192]
-
blk.23.attn_q.weightQ3_K[8192 8192]
-
blk.23.attn_v.weightQ4_K[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_K[22016 8192]
-
blk.24.ffn_gate.weightQ3_K[8192 22016]
-
blk.24.ffn_up.weightQ3_K[8192 22016]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightQ3_K[8192 1024]
-
blk.24.attn_output.weightQ4_K[8192 8192]
-
blk.24.attn_q.weightQ3_K[8192 8192]
-
blk.24.attn_v.weightQ4_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_K[22016 8192]
-
blk.25.ffn_gate.weightQ3_K[8192 22016]
-
blk.25.ffn_up.weightQ3_K[8192 22016]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightQ3_K[8192 1024]
-
blk.25.attn_output.weightQ4_K[8192 8192]
-
blk.25.attn_q.weightQ3_K[8192 8192]
-
blk.25.attn_v.weightQ4_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_K[22016 8192]
-
blk.26.ffn_gate.weightQ3_K[8192 22016]
-
blk.26.ffn_up.weightQ3_K[8192 22016]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.weightQ3_K[8192 1024]
-
blk.26.attn_output.weightQ4_K[8192 8192]
-
blk.26.attn_q.weightQ3_K[8192 8192]
-
blk.26.attn_v.weightQ4_K[8192 1024]
-
blk.27.ffn_gate.weightQ3_K[8192 22016]
-
blk.27.ffn_up.weightQ3_K[8192 22016]
-
blk.27.attn_k.weightQ3_K[8192 1024]
-
blk.27.attn_output.weightQ4_K[8192 8192]
-
blk.27.attn_q.weightQ3_K[8192 8192]
-
blk.27.attn_v.weightQ4_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_K[22016 8192]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_K[22016 8192]
-
blk.28.ffn_gate.weightQ3_K[8192 22016]
-
blk.28.ffn_up.weightQ3_K[8192 22016]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ3_K[8192 1024]
-
blk.28.attn_output.weightQ4_K[8192 8192]
-
blk.28.attn_q.weightQ3_K[8192 8192]
-
blk.28.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_K[22016 8192]
-
blk.29.ffn_gate.weightQ3_K[8192 22016]
-
blk.29.ffn_up.weightQ3_K[8192 22016]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.weightQ3_K[8192 1024]
-
blk.29.attn_output.weightQ4_K[8192 8192]
-
blk.29.attn_q.weightQ3_K[8192 8192]
-
blk.29.attn_v.weightQ4_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_K[22016 8192]
-
blk.30.ffn_gate.weightQ3_K[8192 22016]
-
blk.30.ffn_up.weightQ3_K[8192 22016]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.weightQ3_K[8192 1024]
-
blk.30.attn_output.weightQ4_K[8192 8192]
-
blk.30.attn_q.weightQ3_K[8192 8192]
-
blk.30.attn_v.weightQ4_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_K[22016 8192]
-
blk.31.ffn_gate.weightQ3_K[8192 22016]
-
blk.31.ffn_up.weightQ3_K[8192 22016]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightQ3_K[8192 1024]
-
blk.31.attn_output.weightQ4_K[8192 8192]
-
blk.31.attn_q.weightQ3_K[8192 8192]
-
blk.31.attn_v.weightQ4_K[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_K[22016 8192]
-
blk.32.ffn_gate.weightQ3_K[8192 22016]
-
blk.32.ffn_up.weightQ3_K[8192 22016]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.weightQ3_K[8192 1024]
-
blk.32.attn_output.weightQ4_K[8192 8192]
-
blk.32.attn_q.weightQ3_K[8192 8192]
-
blk.32.attn_v.weightQ4_K[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_K[22016 8192]
-
blk.33.ffn_gate.weightQ3_K[8192 22016]
-
blk.33.ffn_up.weightQ3_K[8192 22016]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.weightQ3_K[8192 1024]
-
blk.33.attn_output.weightQ4_K[8192 8192]
-
blk.33.attn_q.weightQ3_K[8192 8192]
-
blk.33.attn_v.weightQ4_K[8192 1024]
-
blk.34.ffn_gate.weightQ3_K[8192 22016]
-
blk.34.ffn_up.weightQ3_K[8192 22016]
-
blk.34.attn_k.weightQ3_K[8192 1024]
-
blk.34.attn_output.weightQ4_K[8192 8192]
-
blk.34.attn_q.weightQ3_K[8192 8192]
-
blk.34.attn_v.weightQ4_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_K[22016 8192]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_K[22016 8192]
-
blk.35.ffn_gate.weightQ3_K[8192 22016]
-
blk.35.ffn_up.weightQ3_K[8192 22016]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.weightQ3_K[8192 1024]
-
blk.35.attn_output.weightQ4_K[8192 8192]
-
blk.35.attn_q.weightQ3_K[8192 8192]
-
blk.35.attn_v.weightQ4_K[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_K[22016 8192]
-
blk.36.ffn_gate.weightQ3_K[8192 22016]
-
blk.36.ffn_up.weightQ3_K[8192 22016]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.weightQ3_K[8192 1024]
-
blk.36.attn_output.weightQ4_K[8192 8192]
-
blk.36.attn_q.weightQ3_K[8192 8192]
-
blk.36.attn_v.weightQ4_K[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_K[22016 8192]
-
blk.37.ffn_gate.weightQ3_K[8192 22016]
-
blk.37.ffn_up.weightQ3_K[8192 22016]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightQ3_K[8192 1024]
-
blk.37.attn_output.weightQ4_K[8192 8192]
-
blk.37.attn_q.weightQ3_K[8192 8192]
-
blk.37.attn_v.weightQ4_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_K[22016 8192]
-
blk.38.ffn_gate.weightQ3_K[8192 22016]
-
blk.38.ffn_up.weightQ3_K[8192 22016]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightQ3_K[8192 1024]
-
blk.38.attn_output.weightQ4_K[8192 8192]
-
blk.38.attn_q.weightQ3_K[8192 8192]
-
blk.38.attn_v.weightQ4_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_K[22016 8192]
-
blk.39.ffn_gate.weightQ3_K[8192 22016]
-
blk.39.ffn_up.weightQ3_K[8192 22016]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ3_K[8192 1024]
-
blk.39.attn_output.weightQ4_K[8192 8192]
-
blk.39.attn_q.weightQ3_K[8192 8192]
-
blk.39.attn_v.weightQ4_K[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ4_K[22016 8192]
-
blk.40.ffn_gate.weightQ3_K[8192 22016]
-
blk.40.ffn_up.weightQ3_K[8192 22016]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.weightQ3_K[8192 1024]
-
blk.40.attn_output.weightQ4_K[8192 8192]
-
blk.40.attn_q.weightQ3_K[8192 8192]
-
blk.40.attn_v.weightQ4_K[8192 1024]
-
blk.41.ffn_gate.weightQ3_K[8192 22016]
-
blk.41.ffn_up.weightQ3_K[8192 22016]
-
blk.41.attn_k.weightQ3_K[8192 1024]
-
blk.41.attn_output.weightQ4_K[8192 8192]
-
blk.41.attn_q.weightQ3_K[8192 8192]
-
blk.41.attn_v.weightQ4_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ4_K[22016 8192]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ4_K[22016 8192]
-
blk.42.ffn_gate.weightQ3_K[8192 22016]
-
blk.42.ffn_up.weightQ3_K[8192 22016]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightQ3_K[8192 1024]
-
blk.42.attn_output.weightQ4_K[8192 8192]
-
blk.42.attn_q.weightQ3_K[8192 8192]
-
blk.42.attn_v.weightQ4_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ4_K[22016 8192]
-
blk.43.ffn_gate.weightQ3_K[8192 22016]
-
blk.43.ffn_up.weightQ3_K[8192 22016]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.weightQ3_K[8192 1024]
-
blk.43.attn_output.weightQ4_K[8192 8192]
-
blk.43.attn_q.weightQ3_K[8192 8192]
-
blk.43.attn_v.weightQ4_K[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ4_K[22016 8192]
-
blk.44.ffn_gate.weightQ3_K[8192 22016]
-
blk.44.ffn_up.weightQ3_K[8192 22016]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.weightQ3_K[8192 1024]
-
blk.44.attn_output.weightQ4_K[8192 8192]
-
blk.44.attn_q.weightQ3_K[8192 8192]
-
blk.44.attn_v.weightQ4_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ4_K[22016 8192]
-
blk.45.ffn_gate.weightQ3_K[8192 22016]
-
blk.45.ffn_up.weightQ3_K[8192 22016]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightQ3_K[8192 1024]
-
blk.45.attn_output.weightQ4_K[8192 8192]
-
blk.45.attn_q.weightQ3_K[8192 8192]
-
blk.45.attn_v.weightQ4_K[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ4_K[22016 8192]
-
blk.46.ffn_gate.weightQ3_K[8192 22016]
-
blk.46.ffn_up.weightQ3_K[8192 22016]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.weightQ3_K[8192 1024]
-
blk.46.attn_output.weightQ4_K[8192 8192]
-
blk.46.attn_q.weightQ3_K[8192 8192]
-
blk.46.attn_v.weightQ4_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ4_K[22016 8192]
-
blk.47.ffn_gate.weightQ3_K[8192 22016]
-
blk.47.ffn_up.weightQ3_K[8192 22016]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.weightQ3_K[8192 1024]
-
blk.47.attn_output.weightQ4_K[8192 8192]
-
blk.47.attn_q.weightQ3_K[8192 8192]
-
blk.47.attn_v.weightQ4_K[8192 1024]
-
output.weightQ6_K[8192 32000]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47