latest
7.9GB
13B
7 Pulls Updated 10 months ago
abfb4a5d8680 · 7.9GB
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count40
-
llama.attention.head_count_kv40
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count40
-
llama.context_length4096
-
llama.embedding_length5120
-
llama.feed_forward_length13824
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
NameTypeShape
-
token_embd.weightQ4_K[5120 32000]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ6_K[13824 5120]
-
blk.0.ffn_gate.weightQ4_K[5120 13824]
-
blk.0.ffn_up.weightQ4_K[5120 13824]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.weightQ4_K[5120 5120]
-
blk.0.attn_output.weightQ4_K[5120 5120]
-
blk.0.attn_q.weightQ4_K[5120 5120]
-
blk.0.attn_v.weightQ6_K[5120 5120]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ6_K[13824 5120]
-
blk.1.ffn_gate.weightQ4_K[5120 13824]
-
blk.1.ffn_up.weightQ4_K[5120 13824]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.weightQ4_K[5120 5120]
-
blk.1.attn_output.weightQ4_K[5120 5120]
-
blk.1.attn_q.weightQ4_K[5120 5120]
-
blk.1.attn_v.weightQ6_K[5120 5120]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ6_K[13824 5120]
-
blk.2.ffn_gate.weightQ4_K[5120 13824]
-
blk.2.ffn_up.weightQ4_K[5120 13824]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.weightQ4_K[5120 5120]
-
blk.2.attn_output.weightQ4_K[5120 5120]
-
blk.2.attn_q.weightQ4_K[5120 5120]
-
blk.2.attn_v.weightQ6_K[5120 5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ4_K[13824 5120]
-
blk.3.ffn_gate.weightQ4_K[5120 13824]
-
blk.3.ffn_up.weightQ4_K[5120 13824]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.weightQ4_K[5120 5120]
-
blk.3.attn_output.weightQ4_K[5120 5120]
-
blk.3.attn_q.weightQ4_K[5120 5120]
-
blk.3.attn_v.weightQ4_K[5120 5120]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ4_K[13824 5120]
-
blk.4.ffn_gate.weightQ4_K[5120 13824]
-
blk.4.ffn_up.weightQ4_K[5120 13824]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.weightQ4_K[5120 5120]
-
blk.4.attn_output.weightQ4_K[5120 5120]
-
blk.4.attn_q.weightQ4_K[5120 5120]
-
blk.4.attn_v.weightQ4_K[5120 5120]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ6_K[13824 5120]
-
blk.5.ffn_gate.weightQ4_K[5120 13824]
-
blk.5.ffn_up.weightQ4_K[5120 13824]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.weightQ4_K[5120 5120]
-
blk.5.attn_output.weightQ4_K[5120 5120]
-
blk.5.attn_q.weightQ4_K[5120 5120]
-
blk.5.attn_v.weightQ6_K[5120 5120]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ4_K[13824 5120]
-
blk.6.ffn_gate.weightQ4_K[5120 13824]
-
blk.6.ffn_up.weightQ4_K[5120 13824]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.attn_k.weightQ4_K[5120 5120]
-
blk.6.attn_output.weightQ4_K[5120 5120]
-
blk.6.attn_q.weightQ4_K[5120 5120]
-
blk.6.attn_v.weightQ4_K[5120 5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ4_K[13824 5120]
-
blk.7.ffn_gate.weightQ4_K[5120 13824]
-
blk.7.ffn_up.weightQ4_K[5120 13824]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.weightQ4_K[5120 5120]
-
blk.7.attn_output.weightQ4_K[5120 5120]
-
blk.7.attn_q.weightQ4_K[5120 5120]
-
blk.7.attn_v.weightQ4_K[5120 5120]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ6_K[13824 5120]
-
blk.8.ffn_gate.weightQ4_K[5120 13824]
-
blk.8.ffn_up.weightQ4_K[5120 13824]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.weightQ4_K[5120 5120]
-
blk.8.attn_output.weightQ4_K[5120 5120]
-
blk.8.attn_q.weightQ4_K[5120 5120]
-
blk.8.attn_v.weightQ6_K[5120 5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ4_K[13824 5120]
-
blk.9.ffn_gate.weightQ4_K[5120 13824]
-
blk.9.ffn_up.weightQ4_K[5120 13824]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.weightQ4_K[5120 5120]
-
blk.9.attn_output.weightQ4_K[5120 5120]
-
blk.9.attn_q.weightQ4_K[5120 5120]
-
blk.9.attn_v.weightQ4_K[5120 5120]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ6_K[13824 5120]
-
blk.10.ffn_gate.weightQ4_K[5120 13824]
-
blk.10.ffn_up.weightQ4_K[5120 13824]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.weightQ4_K[5120 5120]
-
blk.10.attn_output.weightQ4_K[5120 5120]
-
blk.10.attn_q.weightQ4_K[5120 5120]
-
blk.10.attn_v.weightQ6_K[5120 5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ6_K[13824 5120]
-
blk.11.ffn_gate.weightQ4_K[5120 13824]
-
blk.11.ffn_up.weightQ4_K[5120 13824]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.weightQ4_K[5120 5120]
-
blk.11.attn_output.weightQ4_K[5120 5120]
-
blk.11.attn_q.weightQ4_K[5120 5120]
-
blk.11.attn_v.weightQ6_K[5120 5120]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ6_K[13824 5120]
-
blk.12.ffn_gate.weightQ4_K[5120 13824]
-
blk.12.ffn_up.weightQ4_K[5120 13824]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.weightQ4_K[5120 5120]
-
blk.12.attn_output.weightQ4_K[5120 5120]
-
blk.12.attn_q.weightQ4_K[5120 5120]
-
blk.12.attn_v.weightQ6_K[5120 5120]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ4_K[13824 5120]
-
blk.13.ffn_gate.weightQ4_K[5120 13824]
-
blk.13.ffn_up.weightQ4_K[5120 13824]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.weightQ4_K[5120 5120]
-
blk.13.attn_output.weightQ4_K[5120 5120]
-
blk.13.attn_q.weightQ4_K[5120 5120]
-
blk.13.attn_v.weightQ4_K[5120 5120]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ4_K[13824 5120]
-
blk.14.ffn_gate.weightQ4_K[5120 13824]
-
blk.14.ffn_up.weightQ4_K[5120 13824]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.weightQ4_K[5120 5120]
-
blk.14.attn_output.weightQ4_K[5120 5120]
-
blk.14.attn_q.weightQ4_K[5120 5120]
-
blk.14.attn_v.weightQ4_K[5120 5120]
-
blk.15.attn_k.weightQ4_K[5120 5120]
-
blk.15.attn_q.weightQ4_K[5120 5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ4_K[13824 5120]
-
blk.15.ffn_gate.weightQ4_K[5120 13824]
-
blk.15.ffn_up.weightQ4_K[5120 13824]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ4_K[5120 5120]
-
blk.15.attn_v.weightQ4_K[5120 5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ6_K[13824 5120]
-
blk.16.ffn_gate.weightQ4_K[5120 13824]
-
blk.16.ffn_up.weightQ4_K[5120 13824]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.weightQ4_K[5120 5120]
-
blk.16.attn_output.weightQ4_K[5120 5120]
-
blk.16.attn_q.weightQ4_K[5120 5120]
-
blk.16.attn_v.weightQ6_K[5120 5120]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ4_K[13824 5120]
-
blk.17.ffn_gate.weightQ4_K[5120 13824]
-
blk.17.ffn_up.weightQ4_K[5120 13824]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.weightQ4_K[5120 5120]
-
blk.17.attn_output.weightQ4_K[5120 5120]
-
blk.17.attn_q.weightQ4_K[5120 5120]
-
blk.17.attn_v.weightQ4_K[5120 5120]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ4_K[13824 5120]
-
blk.18.ffn_gate.weightQ4_K[5120 13824]
-
blk.18.ffn_up.weightQ4_K[5120 13824]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.weightQ4_K[5120 5120]
-
blk.18.attn_output.weightQ4_K[5120 5120]
-
blk.18.attn_q.weightQ4_K[5120 5120]
-
blk.18.attn_v.weightQ4_K[5120 5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ6_K[13824 5120]
-
blk.19.ffn_gate.weightQ4_K[5120 13824]
-
blk.19.ffn_up.weightQ4_K[5120 13824]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.weightQ4_K[5120 5120]
-
blk.19.attn_output.weightQ4_K[5120 5120]
-
blk.19.attn_q.weightQ4_K[5120 5120]
-
blk.19.attn_v.weightQ6_K[5120 5120]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ4_K[13824 5120]
-
blk.20.ffn_gate.weightQ4_K[5120 13824]
-
blk.20.ffn_up.weightQ4_K[5120 13824]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.weightQ4_K[5120 5120]
-
blk.20.attn_output.weightQ4_K[5120 5120]
-
blk.20.attn_q.weightQ4_K[5120 5120]
-
blk.20.attn_v.weightQ4_K[5120 5120]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ4_K[13824 5120]
-
blk.21.ffn_gate.weightQ4_K[5120 13824]
-
blk.21.ffn_up.weightQ4_K[5120 13824]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.weightQ4_K[5120 5120]
-
blk.21.attn_output.weightQ4_K[5120 5120]
-
blk.21.attn_q.weightQ4_K[5120 5120]
-
blk.21.attn_v.weightQ4_K[5120 5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ6_K[13824 5120]
-
blk.22.ffn_gate.weightQ4_K[5120 13824]
-
blk.22.ffn_up.weightQ4_K[5120 13824]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.weightQ4_K[5120 5120]
-
blk.22.attn_output.weightQ4_K[5120 5120]
-
blk.22.attn_q.weightQ4_K[5120 5120]
-
blk.22.attn_v.weightQ6_K[5120 5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ4_K[13824 5120]
-
blk.23.ffn_gate.weightQ4_K[5120 13824]
-
blk.23.ffn_up.weightQ4_K[5120 13824]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.weightQ4_K[5120 5120]
-
blk.23.attn_output.weightQ4_K[5120 5120]
-
blk.23.attn_q.weightQ4_K[5120 5120]
-
blk.23.attn_v.weightQ4_K[5120 5120]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ4_K[13824 5120]
-
blk.24.ffn_gate.weightQ4_K[5120 13824]
-
blk.24.ffn_up.weightQ4_K[5120 13824]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.weightQ4_K[5120 5120]
-
blk.24.attn_output.weightQ4_K[5120 5120]
-
blk.24.attn_q.weightQ4_K[5120 5120]
-
blk.24.attn_v.weightQ4_K[5120 5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ6_K[13824 5120]
-
blk.25.ffn_gate.weightQ4_K[5120 13824]
-
blk.25.ffn_up.weightQ4_K[5120 13824]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.weightQ4_K[5120 5120]
-
blk.25.attn_output.weightQ4_K[5120 5120]
-
blk.25.attn_q.weightQ4_K[5120 5120]
-
blk.25.attn_v.weightQ6_K[5120 5120]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ4_K[13824 5120]
-
blk.26.ffn_gate.weightQ4_K[5120 13824]
-
blk.26.ffn_up.weightQ4_K[5120 13824]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.weightQ4_K[5120 5120]
-
blk.26.attn_output.weightQ4_K[5120 5120]
-
blk.26.attn_q.weightQ4_K[5120 5120]
-
blk.26.attn_v.weightQ4_K[5120 5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ4_K[13824 5120]
-
blk.27.ffn_gate.weightQ4_K[5120 13824]
-
blk.27.ffn_up.weightQ4_K[5120 13824]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.weightQ4_K[5120 5120]
-
blk.27.attn_output.weightQ4_K[5120 5120]
-
blk.27.attn_q.weightQ4_K[5120 5120]
-
blk.27.attn_v.weightQ4_K[5120 5120]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ6_K[13824 5120]
-
blk.28.ffn_gate.weightQ4_K[5120 13824]
-
blk.28.ffn_up.weightQ4_K[5120 13824]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.weightQ4_K[5120 5120]
-
blk.28.attn_output.weightQ4_K[5120 5120]
-
blk.28.attn_q.weightQ4_K[5120 5120]
-
blk.28.attn_v.weightQ6_K[5120 5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ4_K[13824 5120]
-
blk.29.ffn_gate.weightQ4_K[5120 13824]
-
blk.29.ffn_up.weightQ4_K[5120 13824]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.weightQ4_K[5120 5120]
-
blk.29.attn_output.weightQ4_K[5120 5120]
-
blk.29.attn_q.weightQ4_K[5120 5120]
-
blk.29.attn_v.weightQ4_K[5120 5120]
-
blk.30.ffn_gate.weightQ4_K[5120 13824]
-
blk.30.ffn_up.weightQ4_K[5120 13824]
-
blk.30.attn_k.weightQ4_K[5120 5120]
-
blk.30.attn_output.weightQ4_K[5120 5120]
-
blk.30.attn_q.weightQ4_K[5120 5120]
-
blk.30.attn_v.weightQ4_K[5120 5120]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ4_K[13824 5120]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ6_K[13824 5120]
-
blk.31.ffn_gate.weightQ4_K[5120 13824]
-
blk.31.ffn_up.weightQ4_K[5120 13824]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.weightQ4_K[5120 5120]
-
blk.31.attn_output.weightQ4_K[5120 5120]
-
blk.31.attn_q.weightQ4_K[5120 5120]
-
blk.31.attn_v.weightQ6_K[5120 5120]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ4_K[13824 5120]
-
blk.32.ffn_gate.weightQ4_K[5120 13824]
-
blk.32.ffn_up.weightQ4_K[5120 13824]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.weightQ4_K[5120 5120]
-
blk.32.attn_output.weightQ4_K[5120 5120]
-
blk.32.attn_q.weightQ4_K[5120 5120]
-
blk.32.attn_v.weightQ4_K[5120 5120]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ4_K[13824 5120]
-
blk.33.ffn_gate.weightQ4_K[5120 13824]
-
blk.33.ffn_up.weightQ4_K[5120 13824]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.weightQ4_K[5120 5120]
-
blk.33.attn_output.weightQ4_K[5120 5120]
-
blk.33.attn_q.weightQ4_K[5120 5120]
-
blk.33.attn_v.weightQ4_K[5120 5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ6_K[13824 5120]
-
blk.34.ffn_gate.weightQ4_K[5120 13824]
-
blk.34.ffn_up.weightQ4_K[5120 13824]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.weightQ4_K[5120 5120]
-
blk.34.attn_output.weightQ4_K[5120 5120]
-
blk.34.attn_q.weightQ4_K[5120 5120]
-
blk.34.attn_v.weightQ6_K[5120 5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ6_K[13824 5120]
-
blk.35.ffn_gate.weightQ4_K[5120 13824]
-
blk.35.ffn_up.weightQ4_K[5120 13824]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.weightQ4_K[5120 5120]
-
blk.35.attn_output.weightQ4_K[5120 5120]
-
blk.35.attn_q.weightQ4_K[5120 5120]
-
blk.35.attn_v.weightQ6_K[5120 5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ6_K[13824 5120]
-
blk.36.ffn_gate.weightQ4_K[5120 13824]
-
blk.36.ffn_up.weightQ4_K[5120 13824]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.weightQ4_K[5120 5120]
-
blk.36.attn_output.weightQ4_K[5120 5120]
-
blk.36.attn_q.weightQ4_K[5120 5120]
-
blk.36.attn_v.weightQ6_K[5120 5120]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ6_K[13824 5120]
-
blk.37.ffn_gate.weightQ4_K[5120 13824]
-
blk.37.ffn_up.weightQ4_K[5120 13824]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.weightQ4_K[5120 5120]
-
blk.37.attn_output.weightQ4_K[5120 5120]
-
blk.37.attn_q.weightQ4_K[5120 5120]
-
blk.37.attn_v.weightQ6_K[5120 5120]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ6_K[13824 5120]
-
blk.38.ffn_gate.weightQ4_K[5120 13824]
-
blk.38.ffn_up.weightQ4_K[5120 13824]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.weightQ4_K[5120 5120]
-
blk.38.attn_output.weightQ4_K[5120 5120]
-
blk.38.attn_q.weightQ4_K[5120 5120]
-
blk.38.attn_v.weightQ6_K[5120 5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ6_K[13824 5120]
-
blk.39.ffn_gate.weightQ4_K[5120 13824]
-
blk.39.ffn_up.weightQ4_K[5120 13824]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.weightQ4_K[5120 5120]
-
blk.39.attn_output.weightQ4_K[5120 5120]
-
blk.39.attn_q.weightQ4_K[5120 5120]
-
blk.39.attn_v.weightQ6_K[5120 5120]
-
output.weightQ6_K[5120 32000]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39