Code Llama with 16k context unlocked in the Modelfile
13B
34B
173 Pulls Updated 10 months ago
e73cc17c7181 · 7.4GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count40
-
llama.attention.head_count_kv40
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count40
-
llama.context_length16384
-
llama.embedding_length5120
-
llama.feed_forward_length13824
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_0[5120 32016]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ4_0[13824 5120]
-
blk.0.ffn_gate.weightQ4_0[5120 13824]
-
blk.0.ffn_up.weightQ4_0[5120 13824]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.weightQ4_0[5120 5120]
-
blk.0.attn_output.weightQ4_0[5120 5120]
-
blk.0.attn_q.weightQ4_0[5120 5120]
-
blk.0.attn_v.weightQ4_0[5120 5120]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ4_0[13824 5120]
-
blk.1.ffn_gate.weightQ4_0[5120 13824]
-
blk.1.ffn_up.weightQ4_0[5120 13824]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.weightQ4_0[5120 5120]
-
blk.1.attn_output.weightQ4_0[5120 5120]
-
blk.1.attn_q.weightQ4_0[5120 5120]
-
blk.1.attn_v.weightQ4_0[5120 5120]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ4_0[13824 5120]
-
blk.2.ffn_gate.weightQ4_0[5120 13824]
-
blk.2.ffn_up.weightQ4_0[5120 13824]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.weightQ4_0[5120 5120]
-
blk.2.attn_output.weightQ4_0[5120 5120]
-
blk.2.attn_q.weightQ4_0[5120 5120]
-
blk.2.attn_v.weightQ4_0[5120 5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ4_0[13824 5120]
-
blk.3.ffn_gate.weightQ4_0[5120 13824]
-
blk.3.ffn_up.weightQ4_0[5120 13824]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.weightQ4_0[5120 5120]
-
blk.3.attn_output.weightQ4_0[5120 5120]
-
blk.3.attn_q.weightQ4_0[5120 5120]
-
blk.3.attn_v.weightQ4_0[5120 5120]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ4_0[13824 5120]
-
blk.4.ffn_gate.weightQ4_0[5120 13824]
-
blk.4.ffn_up.weightQ4_0[5120 13824]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.weightQ4_0[5120 5120]
-
blk.4.attn_output.weightQ4_0[5120 5120]
-
blk.4.attn_q.weightQ4_0[5120 5120]
-
blk.4.attn_v.weightQ4_0[5120 5120]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ4_0[13824 5120]
-
blk.5.ffn_gate.weightQ4_0[5120 13824]
-
blk.5.ffn_up.weightQ4_0[5120 13824]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.weightQ4_0[5120 5120]
-
blk.5.attn_output.weightQ4_0[5120 5120]
-
blk.5.attn_q.weightQ4_0[5120 5120]
-
blk.5.attn_v.weightQ4_0[5120 5120]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ4_0[13824 5120]
-
blk.6.ffn_gate.weightQ4_0[5120 13824]
-
blk.6.ffn_up.weightQ4_0[5120 13824]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.attn_k.weightQ4_0[5120 5120]
-
blk.6.attn_output.weightQ4_0[5120 5120]
-
blk.6.attn_q.weightQ4_0[5120 5120]
-
blk.6.attn_v.weightQ4_0[5120 5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ4_0[13824 5120]
-
blk.7.ffn_gate.weightQ4_0[5120 13824]
-
blk.7.ffn_up.weightQ4_0[5120 13824]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.weightQ4_0[5120 5120]
-
blk.7.attn_output.weightQ4_0[5120 5120]
-
blk.7.attn_q.weightQ4_0[5120 5120]
-
blk.7.attn_v.weightQ4_0[5120 5120]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ4_0[13824 5120]
-
blk.8.ffn_gate.weightQ4_0[5120 13824]
-
blk.8.ffn_up.weightQ4_0[5120 13824]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.weightQ4_0[5120 5120]
-
blk.8.attn_output.weightQ4_0[5120 5120]
-
blk.8.attn_q.weightQ4_0[5120 5120]
-
blk.8.attn_v.weightQ4_0[5120 5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ4_0[13824 5120]
-
blk.9.ffn_gate.weightQ4_0[5120 13824]
-
blk.9.ffn_up.weightQ4_0[5120 13824]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.weightQ4_0[5120 5120]
-
blk.9.attn_output.weightQ4_0[5120 5120]
-
blk.9.attn_q.weightQ4_0[5120 5120]
-
blk.9.attn_v.weightQ4_0[5120 5120]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ4_0[13824 5120]
-
blk.10.ffn_gate.weightQ4_0[5120 13824]
-
blk.10.ffn_up.weightQ4_0[5120 13824]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.weightQ4_0[5120 5120]
-
blk.10.attn_output.weightQ4_0[5120 5120]
-
blk.10.attn_q.weightQ4_0[5120 5120]
-
blk.10.attn_v.weightQ4_0[5120 5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ4_0[13824 5120]
-
blk.11.ffn_gate.weightQ4_0[5120 13824]
-
blk.11.ffn_up.weightQ4_0[5120 13824]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.weightQ4_0[5120 5120]
-
blk.11.attn_output.weightQ4_0[5120 5120]
-
blk.11.attn_q.weightQ4_0[5120 5120]
-
blk.11.attn_v.weightQ4_0[5120 5120]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ4_0[13824 5120]
-
blk.12.ffn_gate.weightQ4_0[5120 13824]
-
blk.12.ffn_up.weightQ4_0[5120 13824]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.weightQ4_0[5120 5120]
-
blk.12.attn_output.weightQ4_0[5120 5120]
-
blk.12.attn_q.weightQ4_0[5120 5120]
-
blk.12.attn_v.weightQ4_0[5120 5120]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ4_0[13824 5120]
-
blk.13.ffn_gate.weightQ4_0[5120 13824]
-
blk.13.ffn_up.weightQ4_0[5120 13824]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.weightQ4_0[5120 5120]
-
blk.13.attn_output.weightQ4_0[5120 5120]
-
blk.13.attn_q.weightQ4_0[5120 5120]
-
blk.13.attn_v.weightQ4_0[5120 5120]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ4_0[13824 5120]
-
blk.14.ffn_gate.weightQ4_0[5120 13824]
-
blk.14.ffn_up.weightQ4_0[5120 13824]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.weightQ4_0[5120 5120]
-
blk.14.attn_output.weightQ4_0[5120 5120]
-
blk.14.attn_q.weightQ4_0[5120 5120]
-
blk.14.attn_v.weightQ4_0[5120 5120]
-
blk.15.attn_k.weightQ4_0[5120 5120]
-
blk.15.attn_q.weightQ4_0[5120 5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ4_0[13824 5120]
-
blk.15.ffn_gate.weightQ4_0[5120 13824]
-
blk.15.ffn_up.weightQ4_0[5120 13824]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ4_0[5120 5120]
-
blk.15.attn_v.weightQ4_0[5120 5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ4_0[13824 5120]
-
blk.16.ffn_gate.weightQ4_0[5120 13824]
-
blk.16.ffn_up.weightQ4_0[5120 13824]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.weightQ4_0[5120 5120]
-
blk.16.attn_output.weightQ4_0[5120 5120]
-
blk.16.attn_q.weightQ4_0[5120 5120]
-
blk.16.attn_v.weightQ4_0[5120 5120]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ4_0[13824 5120]
-
blk.17.ffn_gate.weightQ4_0[5120 13824]
-
blk.17.ffn_up.weightQ4_0[5120 13824]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.weightQ4_0[5120 5120]
-
blk.17.attn_output.weightQ4_0[5120 5120]
-
blk.17.attn_q.weightQ4_0[5120 5120]
-
blk.17.attn_v.weightQ4_0[5120 5120]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ4_0[13824 5120]
-
blk.18.ffn_gate.weightQ4_0[5120 13824]
-
blk.18.ffn_up.weightQ4_0[5120 13824]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.weightQ4_0[5120 5120]
-
blk.18.attn_output.weightQ4_0[5120 5120]
-
blk.18.attn_q.weightQ4_0[5120 5120]
-
blk.18.attn_v.weightQ4_0[5120 5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ4_0[13824 5120]
-
blk.19.ffn_gate.weightQ4_0[5120 13824]
-
blk.19.ffn_up.weightQ4_0[5120 13824]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.weightQ4_0[5120 5120]
-
blk.19.attn_output.weightQ4_0[5120 5120]
-
blk.19.attn_q.weightQ4_0[5120 5120]
-
blk.19.attn_v.weightQ4_0[5120 5120]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ4_0[13824 5120]
-
blk.20.ffn_gate.weightQ4_0[5120 13824]
-
blk.20.ffn_up.weightQ4_0[5120 13824]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.weightQ4_0[5120 5120]
-
blk.20.attn_output.weightQ4_0[5120 5120]
-
blk.20.attn_q.weightQ4_0[5120 5120]
-
blk.20.attn_v.weightQ4_0[5120 5120]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ4_0[13824 5120]
-
blk.21.ffn_gate.weightQ4_0[5120 13824]
-
blk.21.ffn_up.weightQ4_0[5120 13824]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.weightQ4_0[5120 5120]
-
blk.21.attn_output.weightQ4_0[5120 5120]
-
blk.21.attn_q.weightQ4_0[5120 5120]
-
blk.21.attn_v.weightQ4_0[5120 5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ4_0[13824 5120]
-
blk.22.ffn_gate.weightQ4_0[5120 13824]
-
blk.22.ffn_up.weightQ4_0[5120 13824]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.weightQ4_0[5120 5120]
-
blk.22.attn_output.weightQ4_0[5120 5120]
-
blk.22.attn_q.weightQ4_0[5120 5120]
-
blk.22.attn_v.weightQ4_0[5120 5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ4_0[13824 5120]
-
blk.23.ffn_gate.weightQ4_0[5120 13824]
-
blk.23.ffn_up.weightQ4_0[5120 13824]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.weightQ4_0[5120 5120]
-
blk.23.attn_output.weightQ4_0[5120 5120]
-
blk.23.attn_q.weightQ4_0[5120 5120]
-
blk.23.attn_v.weightQ4_0[5120 5120]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ4_0[13824 5120]
-
blk.24.ffn_gate.weightQ4_0[5120 13824]
-
blk.24.ffn_up.weightQ4_0[5120 13824]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.weightQ4_0[5120 5120]
-
blk.24.attn_output.weightQ4_0[5120 5120]
-
blk.24.attn_q.weightQ4_0[5120 5120]
-
blk.24.attn_v.weightQ4_0[5120 5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ4_0[13824 5120]
-
blk.25.ffn_gate.weightQ4_0[5120 13824]
-
blk.25.ffn_up.weightQ4_0[5120 13824]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.weightQ4_0[5120 5120]
-
blk.25.attn_output.weightQ4_0[5120 5120]
-
blk.25.attn_q.weightQ4_0[5120 5120]
-
blk.25.attn_v.weightQ4_0[5120 5120]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ4_0[13824 5120]
-
blk.26.ffn_gate.weightQ4_0[5120 13824]
-
blk.26.ffn_up.weightQ4_0[5120 13824]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.weightQ4_0[5120 5120]
-
blk.26.attn_output.weightQ4_0[5120 5120]
-
blk.26.attn_q.weightQ4_0[5120 5120]
-
blk.26.attn_v.weightQ4_0[5120 5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ4_0[13824 5120]
-
blk.27.ffn_gate.weightQ4_0[5120 13824]
-
blk.27.ffn_up.weightQ4_0[5120 13824]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.weightQ4_0[5120 5120]
-
blk.27.attn_output.weightQ4_0[5120 5120]
-
blk.27.attn_q.weightQ4_0[5120 5120]
-
blk.27.attn_v.weightQ4_0[5120 5120]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ4_0[13824 5120]
-
blk.28.ffn_gate.weightQ4_0[5120 13824]
-
blk.28.ffn_up.weightQ4_0[5120 13824]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.weightQ4_0[5120 5120]
-
blk.28.attn_output.weightQ4_0[5120 5120]
-
blk.28.attn_q.weightQ4_0[5120 5120]
-
blk.28.attn_v.weightQ4_0[5120 5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ4_0[13824 5120]
-
blk.29.ffn_gate.weightQ4_0[5120 13824]
-
blk.29.ffn_up.weightQ4_0[5120 13824]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.weightQ4_0[5120 5120]
-
blk.29.attn_output.weightQ4_0[5120 5120]
-
blk.29.attn_q.weightQ4_0[5120 5120]
-
blk.29.attn_v.weightQ4_0[5120 5120]
-
blk.30.ffn_gate.weightQ4_0[5120 13824]
-
blk.30.ffn_up.weightQ4_0[5120 13824]
-
blk.30.attn_k.weightQ4_0[5120 5120]
-
blk.30.attn_output.weightQ4_0[5120 5120]
-
blk.30.attn_q.weightQ4_0[5120 5120]
-
blk.30.attn_v.weightQ4_0[5120 5120]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ4_0[13824 5120]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ4_0[13824 5120]
-
blk.31.ffn_gate.weightQ4_0[5120 13824]
-
blk.31.ffn_up.weightQ4_0[5120 13824]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.weightQ4_0[5120 5120]
-
blk.31.attn_output.weightQ4_0[5120 5120]
-
blk.31.attn_q.weightQ4_0[5120 5120]
-
blk.31.attn_v.weightQ4_0[5120 5120]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ4_0[13824 5120]
-
blk.32.ffn_gate.weightQ4_0[5120 13824]
-
blk.32.ffn_up.weightQ4_0[5120 13824]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.weightQ4_0[5120 5120]
-
blk.32.attn_output.weightQ4_0[5120 5120]
-
blk.32.attn_q.weightQ4_0[5120 5120]
-
blk.32.attn_v.weightQ4_0[5120 5120]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ4_0[13824 5120]
-
blk.33.ffn_gate.weightQ4_0[5120 13824]
-
blk.33.ffn_up.weightQ4_0[5120 13824]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.weightQ4_0[5120 5120]
-
blk.33.attn_output.weightQ4_0[5120 5120]
-
blk.33.attn_q.weightQ4_0[5120 5120]
-
blk.33.attn_v.weightQ4_0[5120 5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ4_0[13824 5120]
-
blk.34.ffn_gate.weightQ4_0[5120 13824]
-
blk.34.ffn_up.weightQ4_0[5120 13824]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.weightQ4_0[5120 5120]
-
blk.34.attn_output.weightQ4_0[5120 5120]
-
blk.34.attn_q.weightQ4_0[5120 5120]
-
blk.34.attn_v.weightQ4_0[5120 5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ4_0[13824 5120]
-
blk.35.ffn_gate.weightQ4_0[5120 13824]
-
blk.35.ffn_up.weightQ4_0[5120 13824]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.weightQ4_0[5120 5120]
-
blk.35.attn_output.weightQ4_0[5120 5120]
-
blk.35.attn_q.weightQ4_0[5120 5120]
-
blk.35.attn_v.weightQ4_0[5120 5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ4_0[13824 5120]
-
blk.36.ffn_gate.weightQ4_0[5120 13824]
-
blk.36.ffn_up.weightQ4_0[5120 13824]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.weightQ4_0[5120 5120]
-
blk.36.attn_output.weightQ4_0[5120 5120]
-
blk.36.attn_q.weightQ4_0[5120 5120]
-
blk.36.attn_v.weightQ4_0[5120 5120]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ4_0[13824 5120]
-
blk.37.ffn_gate.weightQ4_0[5120 13824]
-
blk.37.ffn_up.weightQ4_0[5120 13824]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.weightQ4_0[5120 5120]
-
blk.37.attn_output.weightQ4_0[5120 5120]
-
blk.37.attn_q.weightQ4_0[5120 5120]
-
blk.37.attn_v.weightQ4_0[5120 5120]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ4_0[13824 5120]
-
blk.38.ffn_gate.weightQ4_0[5120 13824]
-
blk.38.ffn_up.weightQ4_0[5120 13824]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.weightQ4_0[5120 5120]
-
blk.38.attn_output.weightQ4_0[5120 5120]
-
blk.38.attn_q.weightQ4_0[5120 5120]
-
blk.38.attn_v.weightQ4_0[5120 5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ4_0[13824 5120]
-
blk.39.ffn_gate.weightQ4_0[5120 13824]
-
blk.39.ffn_up.weightQ4_0[5120 13824]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.weightQ4_0[5120 5120]
-
blk.39.attn_output.weightQ4_0[5120 5120]
-
blk.39.attn_q.weightQ4_0[5120 5120]
-
blk.39.attn_v.weightQ4_0[5120 5120]
-
output.weightQ6_K[5120 32016]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39