13B
97 Pulls Updated 12 months ago
32762b3692dd · 6.3GB
-
general.architecturellama
-
general.file_typeQ3_K_M
-
llama.attention.head_count40
-
llama.attention.head_count_kv40
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count40
-
llama.context_length4096
-
llama.embedding_length5120
-
llama.feed_forward_length13824
-
llama.rope.dimension_count128
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ3_K[5120 32032]
-
blk.0.attn_q.weightQ3_K[5120 5120]
-
blk.0.attn_k.weightQ3_K[5120 5120]
-
blk.0.attn_v.weightQ5_K[5120 5120]
-
blk.0.attn_output.weightQ4_K[5120 5120]
-
blk.0.ffn_gate.weightQ3_K[5120 13824]
-
blk.0.ffn_down.weightQ5_K[13824 5120]
-
blk.0.ffn_up.weightQ3_K[5120 13824]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.1.attn_q.weightQ3_K[5120 5120]
-
blk.1.attn_k.weightQ3_K[5120 5120]
-
blk.1.attn_v.weightQ5_K[5120 5120]
-
blk.1.attn_output.weightQ4_K[5120 5120]
-
blk.1.ffn_gate.weightQ3_K[5120 13824]
-
blk.1.ffn_down.weightQ5_K[13824 5120]
-
blk.1.ffn_up.weightQ3_K[5120 13824]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.2.attn_q.weightQ3_K[5120 5120]
-
blk.2.attn_k.weightQ3_K[5120 5120]
-
blk.2.attn_v.weightQ4_K[5120 5120]
-
blk.2.attn_output.weightQ4_K[5120 5120]
-
blk.2.ffn_gate.weightQ3_K[5120 13824]
-
blk.2.ffn_down.weightQ4_K[13824 5120]
-
blk.2.ffn_up.weightQ3_K[5120 13824]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.3.attn_q.weightQ3_K[5120 5120]
-
blk.3.attn_k.weightQ3_K[5120 5120]
-
blk.3.attn_v.weightQ4_K[5120 5120]
-
blk.3.attn_output.weightQ4_K[5120 5120]
-
blk.3.ffn_gate.weightQ3_K[5120 13824]
-
blk.3.ffn_down.weightQ4_K[13824 5120]
-
blk.3.ffn_up.weightQ3_K[5120 13824]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.4.attn_q.weightQ3_K[5120 5120]
-
blk.4.attn_k.weightQ3_K[5120 5120]
-
blk.4.attn_v.weightQ4_K[5120 5120]
-
blk.4.attn_output.weightQ4_K[5120 5120]
-
blk.4.ffn_gate.weightQ3_K[5120 13824]
-
blk.4.ffn_down.weightQ4_K[13824 5120]
-
blk.4.ffn_up.weightQ3_K[5120 13824]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.5.attn_q.weightQ3_K[5120 5120]
-
blk.5.attn_k.weightQ3_K[5120 5120]
-
blk.5.attn_v.weightQ4_K[5120 5120]
-
blk.5.attn_output.weightQ4_K[5120 5120]
-
blk.5.ffn_gate.weightQ3_K[5120 13824]
-
blk.5.ffn_down.weightQ4_K[13824 5120]
-
blk.5.ffn_up.weightQ3_K[5120 13824]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.6.attn_q.weightQ3_K[5120 5120]
-
blk.6.attn_k.weightQ3_K[5120 5120]
-
blk.6.attn_v.weightQ4_K[5120 5120]
-
blk.6.attn_output.weightQ4_K[5120 5120]
-
blk.6.ffn_gate.weightQ3_K[5120 13824]
-
blk.6.ffn_down.weightQ4_K[13824 5120]
-
blk.6.ffn_up.weightQ3_K[5120 13824]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_q.weightQ3_K[5120 5120]
-
blk.7.attn_k.weightQ3_K[5120 5120]
-
blk.7.attn_v.weightQ4_K[5120 5120]
-
blk.7.attn_output.weightQ4_K[5120 5120]
-
blk.7.ffn_gate.weightQ3_K[5120 13824]
-
blk.7.ffn_down.weightQ4_K[13824 5120]
-
blk.7.ffn_up.weightQ3_K[5120 13824]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.8.attn_q.weightQ3_K[5120 5120]
-
blk.8.attn_k.weightQ3_K[5120 5120]
-
blk.8.attn_v.weightQ4_K[5120 5120]
-
blk.8.attn_output.weightQ4_K[5120 5120]
-
blk.8.ffn_gate.weightQ3_K[5120 13824]
-
blk.8.ffn_down.weightQ4_K[13824 5120]
-
blk.8.ffn_up.weightQ3_K[5120 13824]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.9.attn_q.weightQ3_K[5120 5120]
-
blk.9.attn_k.weightQ3_K[5120 5120]
-
blk.9.attn_v.weightQ4_K[5120 5120]
-
blk.9.attn_output.weightQ4_K[5120 5120]
-
blk.9.ffn_gate.weightQ3_K[5120 13824]
-
blk.9.ffn_down.weightQ4_K[13824 5120]
-
blk.9.ffn_up.weightQ3_K[5120 13824]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.10.attn_q.weightQ3_K[5120 5120]
-
blk.10.attn_k.weightQ3_K[5120 5120]
-
blk.10.attn_v.weightQ4_K[5120 5120]
-
blk.10.attn_output.weightQ4_K[5120 5120]
-
blk.10.ffn_gate.weightQ3_K[5120 13824]
-
blk.10.ffn_down.weightQ4_K[13824 5120]
-
blk.10.ffn_up.weightQ3_K[5120 13824]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.11.attn_q.weightQ3_K[5120 5120]
-
blk.11.attn_k.weightQ3_K[5120 5120]
-
blk.11.attn_v.weightQ4_K[5120 5120]
-
blk.11.attn_output.weightQ4_K[5120 5120]
-
blk.11.ffn_gate.weightQ3_K[5120 13824]
-
blk.11.ffn_down.weightQ4_K[13824 5120]
-
blk.11.ffn_up.weightQ3_K[5120 13824]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.12.attn_q.weightQ3_K[5120 5120]
-
blk.12.attn_k.weightQ3_K[5120 5120]
-
blk.12.attn_v.weightQ4_K[5120 5120]
-
blk.12.attn_output.weightQ4_K[5120 5120]
-
blk.12.ffn_gate.weightQ3_K[5120 13824]
-
blk.12.ffn_down.weightQ4_K[13824 5120]
-
blk.12.ffn_up.weightQ3_K[5120 13824]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.13.attn_q.weightQ3_K[5120 5120]
-
blk.13.attn_k.weightQ3_K[5120 5120]
-
blk.13.attn_v.weightQ4_K[5120 5120]
-
blk.13.attn_output.weightQ4_K[5120 5120]
-
blk.13.ffn_gate.weightQ3_K[5120 13824]
-
blk.13.ffn_down.weightQ4_K[13824 5120]
-
blk.13.ffn_up.weightQ3_K[5120 13824]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.14.attn_q.weightQ3_K[5120 5120]
-
blk.14.attn_k.weightQ3_K[5120 5120]
-
blk.14.attn_v.weightQ4_K[5120 5120]
-
blk.14.attn_output.weightQ4_K[5120 5120]
-
blk.14.ffn_gate.weightQ3_K[5120 13824]
-
blk.14.ffn_down.weightQ4_K[13824 5120]
-
blk.14.ffn_up.weightQ3_K[5120 13824]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.15.attn_q.weightQ3_K[5120 5120]
-
blk.15.attn_k.weightQ3_K[5120 5120]
-
blk.15.attn_v.weightQ4_K[5120 5120]
-
blk.15.attn_output.weightQ4_K[5120 5120]
-
blk.15.ffn_gate.weightQ3_K[5120 13824]
-
blk.15.ffn_down.weightQ4_K[13824 5120]
-
blk.15.ffn_up.weightQ3_K[5120 13824]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.16.attn_q.weightQ3_K[5120 5120]
-
blk.16.attn_k.weightQ3_K[5120 5120]
-
blk.16.attn_v.weightQ4_K[5120 5120]
-
blk.16.attn_output.weightQ4_K[5120 5120]
-
blk.16.ffn_gate.weightQ3_K[5120 13824]
-
blk.16.ffn_down.weightQ4_K[13824 5120]
-
blk.16.ffn_up.weightQ3_K[5120 13824]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.17.attn_q.weightQ3_K[5120 5120]
-
blk.17.attn_k.weightQ3_K[5120 5120]
-
blk.17.attn_v.weightQ4_K[5120 5120]
-
blk.17.attn_output.weightQ4_K[5120 5120]
-
blk.17.ffn_gate.weightQ3_K[5120 13824]
-
blk.17.ffn_down.weightQ4_K[13824 5120]
-
blk.17.ffn_up.weightQ3_K[5120 13824]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.18.attn_q.weightQ3_K[5120 5120]
-
blk.18.attn_k.weightQ3_K[5120 5120]
-
blk.18.attn_v.weightQ4_K[5120 5120]
-
blk.18.attn_output.weightQ4_K[5120 5120]
-
blk.18.ffn_gate.weightQ3_K[5120 13824]
-
blk.18.ffn_down.weightQ4_K[13824 5120]
-
blk.18.ffn_up.weightQ3_K[5120 13824]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.19.attn_q.weightQ3_K[5120 5120]
-
blk.19.attn_k.weightQ3_K[5120 5120]
-
blk.19.attn_v.weightQ4_K[5120 5120]
-
blk.19.attn_output.weightQ4_K[5120 5120]
-
blk.19.ffn_gate.weightQ3_K[5120 13824]
-
blk.19.ffn_down.weightQ4_K[13824 5120]
-
blk.19.ffn_up.weightQ3_K[5120 13824]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.20.attn_q.weightQ3_K[5120 5120]
-
blk.20.attn_k.weightQ3_K[5120 5120]
-
blk.20.attn_v.weightQ4_K[5120 5120]
-
blk.20.attn_output.weightQ4_K[5120 5120]
-
blk.20.ffn_gate.weightQ3_K[5120 13824]
-
blk.20.ffn_down.weightQ4_K[13824 5120]
-
blk.20.ffn_up.weightQ3_K[5120 13824]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.21.attn_q.weightQ3_K[5120 5120]
-
blk.21.attn_k.weightQ3_K[5120 5120]
-
blk.21.attn_v.weightQ4_K[5120 5120]
-
blk.21.attn_output.weightQ4_K[5120 5120]
-
blk.21.ffn_gate.weightQ3_K[5120 13824]
-
blk.21.ffn_down.weightQ4_K[13824 5120]
-
blk.21.ffn_up.weightQ3_K[5120 13824]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.22.attn_q.weightQ3_K[5120 5120]
-
blk.22.attn_k.weightQ3_K[5120 5120]
-
blk.22.attn_v.weightQ4_K[5120 5120]
-
blk.22.attn_output.weightQ4_K[5120 5120]
-
blk.22.ffn_gate.weightQ3_K[5120 13824]
-
blk.22.ffn_down.weightQ4_K[13824 5120]
-
blk.22.ffn_up.weightQ3_K[5120 13824]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.23.attn_q.weightQ3_K[5120 5120]
-
blk.23.attn_k.weightQ3_K[5120 5120]
-
blk.23.attn_v.weightQ4_K[5120 5120]
-
blk.23.attn_output.weightQ4_K[5120 5120]
-
blk.23.ffn_gate.weightQ3_K[5120 13824]
-
blk.23.ffn_down.weightQ4_K[13824 5120]
-
blk.23.ffn_up.weightQ3_K[5120 13824]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.24.attn_q.weightQ3_K[5120 5120]
-
blk.24.attn_k.weightQ3_K[5120 5120]
-
blk.24.attn_v.weightQ4_K[5120 5120]
-
blk.24.attn_output.weightQ4_K[5120 5120]
-
blk.24.ffn_gate.weightQ3_K[5120 13824]
-
blk.24.ffn_down.weightQ4_K[13824 5120]
-
blk.24.ffn_up.weightQ3_K[5120 13824]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.25.attn_q.weightQ3_K[5120 5120]
-
blk.25.attn_k.weightQ3_K[5120 5120]
-
blk.25.attn_v.weightQ4_K[5120 5120]
-
blk.25.attn_output.weightQ4_K[5120 5120]
-
blk.25.ffn_gate.weightQ3_K[5120 13824]
-
blk.25.ffn_down.weightQ4_K[13824 5120]
-
blk.25.ffn_up.weightQ3_K[5120 13824]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.26.attn_q.weightQ3_K[5120 5120]
-
blk.26.attn_k.weightQ3_K[5120 5120]
-
blk.26.attn_v.weightQ4_K[5120 5120]
-
blk.26.attn_output.weightQ4_K[5120 5120]
-
blk.26.ffn_gate.weightQ3_K[5120 13824]
-
blk.26.ffn_down.weightQ4_K[13824 5120]
-
blk.26.ffn_up.weightQ3_K[5120 13824]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.27.attn_q.weightQ3_K[5120 5120]
-
blk.27.attn_k.weightQ3_K[5120 5120]
-
blk.27.attn_v.weightQ4_K[5120 5120]
-
blk.27.attn_output.weightQ4_K[5120 5120]
-
blk.27.ffn_gate.weightQ3_K[5120 13824]
-
blk.27.ffn_down.weightQ4_K[13824 5120]
-
blk.27.ffn_up.weightQ3_K[5120 13824]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.28.attn_q.weightQ3_K[5120 5120]
-
blk.28.attn_k.weightQ3_K[5120 5120]
-
blk.28.attn_v.weightQ4_K[5120 5120]
-
blk.28.attn_output.weightQ4_K[5120 5120]
-
blk.28.ffn_gate.weightQ3_K[5120 13824]
-
blk.28.ffn_down.weightQ4_K[13824 5120]
-
blk.28.ffn_up.weightQ3_K[5120 13824]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_q.weightQ3_K[5120 5120]
-
blk.29.attn_k.weightQ3_K[5120 5120]
-
blk.29.attn_v.weightQ4_K[5120 5120]
-
blk.29.attn_output.weightQ4_K[5120 5120]
-
blk.29.ffn_gate.weightQ3_K[5120 13824]
-
blk.29.ffn_down.weightQ4_K[13824 5120]
-
blk.29.ffn_up.weightQ3_K[5120 13824]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.30.attn_q.weightQ3_K[5120 5120]
-
blk.30.attn_k.weightQ3_K[5120 5120]
-
blk.30.attn_v.weightQ4_K[5120 5120]
-
blk.30.attn_output.weightQ4_K[5120 5120]
-
blk.30.ffn_gate.weightQ3_K[5120 13824]
-
blk.30.ffn_down.weightQ4_K[13824 5120]
-
blk.30.ffn_up.weightQ3_K[5120 13824]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.31.attn_q.weightQ3_K[5120 5120]
-
blk.31.attn_k.weightQ3_K[5120 5120]
-
blk.31.attn_v.weightQ4_K[5120 5120]
-
blk.31.attn_output.weightQ4_K[5120 5120]
-
blk.31.ffn_gate.weightQ3_K[5120 13824]
-
blk.31.ffn_down.weightQ4_K[13824 5120]
-
blk.31.ffn_up.weightQ3_K[5120 13824]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.32.attn_q.weightQ3_K[5120 5120]
-
blk.32.attn_k.weightQ3_K[5120 5120]
-
blk.32.attn_v.weightQ4_K[5120 5120]
-
blk.32.attn_output.weightQ4_K[5120 5120]
-
blk.32.ffn_gate.weightQ3_K[5120 13824]
-
blk.32.ffn_down.weightQ4_K[13824 5120]
-
blk.32.ffn_up.weightQ3_K[5120 13824]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.33.attn_q.weightQ3_K[5120 5120]
-
blk.33.attn_k.weightQ3_K[5120 5120]
-
blk.33.attn_v.weightQ4_K[5120 5120]
-
blk.33.attn_output.weightQ4_K[5120 5120]
-
blk.33.ffn_gate.weightQ3_K[5120 13824]
-
blk.33.ffn_down.weightQ4_K[13824 5120]
-
blk.33.ffn_up.weightQ3_K[5120 13824]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.34.attn_q.weightQ3_K[5120 5120]
-
blk.34.attn_k.weightQ3_K[5120 5120]
-
blk.34.attn_v.weightQ4_K[5120 5120]
-
blk.34.attn_output.weightQ4_K[5120 5120]
-
blk.34.ffn_gate.weightQ3_K[5120 13824]
-
blk.34.ffn_down.weightQ4_K[13824 5120]
-
blk.34.ffn_up.weightQ3_K[5120 13824]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.35.attn_q.weightQ3_K[5120 5120]
-
blk.35.attn_k.weightQ3_K[5120 5120]
-
blk.35.attn_v.weightQ4_K[5120 5120]
-
blk.35.attn_output.weightQ4_K[5120 5120]
-
blk.35.ffn_gate.weightQ3_K[5120 13824]
-
blk.35.ffn_down.weightQ4_K[13824 5120]
-
blk.35.ffn_up.weightQ3_K[5120 13824]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.36.attn_q.weightQ3_K[5120 5120]
-
blk.36.attn_k.weightQ3_K[5120 5120]
-
blk.36.attn_v.weightQ4_K[5120 5120]
-
blk.36.attn_output.weightQ4_K[5120 5120]
-
blk.36.ffn_gate.weightQ3_K[5120 13824]
-
blk.36.ffn_down.weightQ4_K[13824 5120]
-
blk.36.ffn_up.weightQ3_K[5120 13824]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.37.attn_q.weightQ3_K[5120 5120]
-
blk.37.attn_k.weightQ3_K[5120 5120]
-
blk.37.attn_v.weightQ4_K[5120 5120]
-
blk.37.attn_output.weightQ4_K[5120 5120]
-
blk.37.ffn_gate.weightQ3_K[5120 13824]
-
blk.37.ffn_down.weightQ4_K[13824 5120]
-
blk.37.ffn_up.weightQ3_K[5120 13824]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.38.attn_q.weightQ3_K[5120 5120]
-
blk.38.attn_k.weightQ3_K[5120 5120]
-
blk.38.attn_v.weightQ4_K[5120 5120]
-
blk.38.attn_output.weightQ4_K[5120 5120]
-
blk.38.ffn_gate.weightQ3_K[5120 13824]
-
blk.38.ffn_down.weightQ4_K[13824 5120]
-
blk.38.ffn_up.weightQ3_K[5120 13824]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.39.attn_q.weightQ3_K[5120 5120]
-
blk.39.attn_k.weightQ3_K[5120 5120]
-
blk.39.attn_v.weightQ4_K[5120 5120]
-
blk.39.attn_output.weightQ4_K[5120 5120]
-
blk.39.ffn_gate.weightQ3_K[5120 13824]
-
blk.39.ffn_down.weightQ4_K[13824 5120]
-
blk.39.ffn_up.weightQ3_K[5120 13824]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_norm.weightF32[5120]
-
output_norm.weightF32[5120]
-
output.weightQ6_K[5120 32032]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39