latest
5.5GB
7B
290 Pulls Updated 6 months ago
ad82c8dd7157 · 5.5GB
-
general.architecturellama
-
general.file_typeQ6_K
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count32
-
llama.context_length4096
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ6_K[4096 32001]
-
blk.0.attn_q.weightQ6_K[4096 4096]
-
blk.0.attn_k.weightQ6_K[4096 4096]
-
blk.0.attn_v.weightQ6_K[4096 4096]
-
blk.0.attn_output.weightQ6_K[4096 4096]
-
blk.0.ffn_gate.weightQ6_K[4096 11008]
-
blk.0.ffn_up.weightQ6_K[4096 11008]
-
blk.0.ffn_down.weightQ6_K[11008 4096]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.1.attn_q.weightQ6_K[4096 4096]
-
blk.1.attn_k.weightQ6_K[4096 4096]
-
blk.1.attn_v.weightQ6_K[4096 4096]
-
blk.1.attn_output.weightQ6_K[4096 4096]
-
blk.1.ffn_gate.weightQ6_K[4096 11008]
-
blk.1.ffn_up.weightQ6_K[4096 11008]
-
blk.1.ffn_down.weightQ6_K[11008 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.2.attn_q.weightQ6_K[4096 4096]
-
blk.2.attn_k.weightQ6_K[4096 4096]
-
blk.2.attn_v.weightQ6_K[4096 4096]
-
blk.2.attn_output.weightQ6_K[4096 4096]
-
blk.2.ffn_gate.weightQ6_K[4096 11008]
-
blk.2.ffn_up.weightQ6_K[4096 11008]
-
blk.2.ffn_down.weightQ6_K[11008 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.3.attn_q.weightQ6_K[4096 4096]
-
blk.3.attn_k.weightQ6_K[4096 4096]
-
blk.3.attn_v.weightQ6_K[4096 4096]
-
blk.3.attn_output.weightQ6_K[4096 4096]
-
blk.3.ffn_gate.weightQ6_K[4096 11008]
-
blk.3.ffn_up.weightQ6_K[4096 11008]
-
blk.3.ffn_down.weightQ6_K[11008 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.4.attn_q.weightQ6_K[4096 4096]
-
blk.4.attn_k.weightQ6_K[4096 4096]
-
blk.4.attn_v.weightQ6_K[4096 4096]
-
blk.4.attn_output.weightQ6_K[4096 4096]
-
blk.4.ffn_gate.weightQ6_K[4096 11008]
-
blk.4.ffn_up.weightQ6_K[4096 11008]
-
blk.4.ffn_down.weightQ6_K[11008 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.5.attn_q.weightQ6_K[4096 4096]
-
blk.5.attn_k.weightQ6_K[4096 4096]
-
blk.5.attn_v.weightQ6_K[4096 4096]
-
blk.5.attn_output.weightQ6_K[4096 4096]
-
blk.5.ffn_gate.weightQ6_K[4096 11008]
-
blk.5.ffn_up.weightQ6_K[4096 11008]
-
blk.5.ffn_down.weightQ6_K[11008 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.6.attn_q.weightQ6_K[4096 4096]
-
blk.6.attn_k.weightQ6_K[4096 4096]
-
blk.6.attn_v.weightQ6_K[4096 4096]
-
blk.6.attn_output.weightQ6_K[4096 4096]
-
blk.6.ffn_gate.weightQ6_K[4096 11008]
-
blk.6.ffn_up.weightQ6_K[4096 11008]
-
blk.6.ffn_down.weightQ6_K[11008 4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.7.attn_q.weightQ6_K[4096 4096]
-
blk.7.attn_k.weightQ6_K[4096 4096]
-
blk.7.attn_v.weightQ6_K[4096 4096]
-
blk.7.attn_output.weightQ6_K[4096 4096]
-
blk.7.ffn_gate.weightQ6_K[4096 11008]
-
blk.7.ffn_up.weightQ6_K[4096 11008]
-
blk.7.ffn_down.weightQ6_K[11008 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.8.attn_q.weightQ6_K[4096 4096]
-
blk.8.attn_k.weightQ6_K[4096 4096]
-
blk.8.attn_v.weightQ6_K[4096 4096]
-
blk.8.attn_output.weightQ6_K[4096 4096]
-
blk.8.ffn_gate.weightQ6_K[4096 11008]
-
blk.8.ffn_up.weightQ6_K[4096 11008]
-
blk.8.ffn_down.weightQ6_K[11008 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.9.attn_q.weightQ6_K[4096 4096]
-
blk.9.attn_k.weightQ6_K[4096 4096]
-
blk.9.attn_v.weightQ6_K[4096 4096]
-
blk.9.attn_output.weightQ6_K[4096 4096]
-
blk.9.ffn_gate.weightQ6_K[4096 11008]
-
blk.9.ffn_up.weightQ6_K[4096 11008]
-
blk.9.ffn_down.weightQ6_K[11008 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.10.attn_q.weightQ6_K[4096 4096]
-
blk.10.attn_k.weightQ6_K[4096 4096]
-
blk.10.attn_v.weightQ6_K[4096 4096]
-
blk.10.attn_output.weightQ6_K[4096 4096]
-
blk.10.ffn_gate.weightQ6_K[4096 11008]
-
blk.10.ffn_up.weightQ6_K[4096 11008]
-
blk.10.ffn_down.weightQ6_K[11008 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.11.attn_q.weightQ6_K[4096 4096]
-
blk.11.attn_k.weightQ6_K[4096 4096]
-
blk.11.attn_v.weightQ6_K[4096 4096]
-
blk.11.attn_output.weightQ6_K[4096 4096]
-
blk.11.ffn_gate.weightQ6_K[4096 11008]
-
blk.11.ffn_up.weightQ6_K[4096 11008]
-
blk.11.ffn_down.weightQ6_K[11008 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.12.attn_q.weightQ6_K[4096 4096]
-
blk.12.attn_k.weightQ6_K[4096 4096]
-
blk.12.attn_v.weightQ6_K[4096 4096]
-
blk.12.attn_output.weightQ6_K[4096 4096]
-
blk.12.ffn_gate.weightQ6_K[4096 11008]
-
blk.12.ffn_up.weightQ6_K[4096 11008]
-
blk.12.ffn_down.weightQ6_K[11008 4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.13.attn_q.weightQ6_K[4096 4096]
-
blk.13.attn_k.weightQ6_K[4096 4096]
-
blk.13.attn_v.weightQ6_K[4096 4096]
-
blk.13.attn_output.weightQ6_K[4096 4096]
-
blk.13.ffn_gate.weightQ6_K[4096 11008]
-
blk.13.ffn_up.weightQ6_K[4096 11008]
-
blk.13.ffn_down.weightQ6_K[11008 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.14.attn_q.weightQ6_K[4096 4096]
-
blk.14.attn_k.weightQ6_K[4096 4096]
-
blk.14.attn_v.weightQ6_K[4096 4096]
-
blk.14.attn_output.weightQ6_K[4096 4096]
-
blk.14.ffn_gate.weightQ6_K[4096 11008]
-
blk.14.ffn_up.weightQ6_K[4096 11008]
-
blk.14.ffn_down.weightQ6_K[11008 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.15.attn_q.weightQ6_K[4096 4096]
-
blk.15.attn_k.weightQ6_K[4096 4096]
-
blk.15.attn_v.weightQ6_K[4096 4096]
-
blk.15.attn_output.weightQ6_K[4096 4096]
-
blk.15.ffn_gate.weightQ6_K[4096 11008]
-
blk.15.ffn_up.weightQ6_K[4096 11008]
-
blk.15.ffn_down.weightQ6_K[11008 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.16.attn_q.weightQ6_K[4096 4096]
-
blk.16.attn_k.weightQ6_K[4096 4096]
-
blk.16.attn_v.weightQ6_K[4096 4096]
-
blk.16.attn_output.weightQ6_K[4096 4096]
-
blk.16.ffn_gate.weightQ6_K[4096 11008]
-
blk.16.ffn_up.weightQ6_K[4096 11008]
-
blk.16.ffn_down.weightQ6_K[11008 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.17.attn_q.weightQ6_K[4096 4096]
-
blk.17.attn_k.weightQ6_K[4096 4096]
-
blk.17.attn_v.weightQ6_K[4096 4096]
-
blk.17.attn_output.weightQ6_K[4096 4096]
-
blk.17.ffn_gate.weightQ6_K[4096 11008]
-
blk.17.ffn_up.weightQ6_K[4096 11008]
-
blk.17.ffn_down.weightQ6_K[11008 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.18.attn_q.weightQ6_K[4096 4096]
-
blk.18.attn_k.weightQ6_K[4096 4096]
-
blk.18.attn_v.weightQ6_K[4096 4096]
-
blk.18.attn_output.weightQ6_K[4096 4096]
-
blk.18.ffn_gate.weightQ6_K[4096 11008]
-
blk.18.ffn_up.weightQ6_K[4096 11008]
-
blk.18.ffn_down.weightQ6_K[11008 4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.19.attn_q.weightQ6_K[4096 4096]
-
blk.19.attn_k.weightQ6_K[4096 4096]
-
blk.19.attn_v.weightQ6_K[4096 4096]
-
blk.19.attn_output.weightQ6_K[4096 4096]
-
blk.19.ffn_gate.weightQ6_K[4096 11008]
-
blk.19.ffn_up.weightQ6_K[4096 11008]
-
blk.19.ffn_down.weightQ6_K[11008 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.20.attn_q.weightQ6_K[4096 4096]
-
blk.20.attn_k.weightQ6_K[4096 4096]
-
blk.20.attn_v.weightQ6_K[4096 4096]
-
blk.20.attn_output.weightQ6_K[4096 4096]
-
blk.20.ffn_gate.weightQ6_K[4096 11008]
-
blk.20.ffn_up.weightQ6_K[4096 11008]
-
blk.20.ffn_down.weightQ6_K[11008 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.21.attn_q.weightQ6_K[4096 4096]
-
blk.21.attn_k.weightQ6_K[4096 4096]
-
blk.21.attn_v.weightQ6_K[4096 4096]
-
blk.21.attn_output.weightQ6_K[4096 4096]
-
blk.21.ffn_gate.weightQ6_K[4096 11008]
-
blk.21.ffn_up.weightQ6_K[4096 11008]
-
blk.21.ffn_down.weightQ6_K[11008 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.22.attn_q.weightQ6_K[4096 4096]
-
blk.22.attn_k.weightQ6_K[4096 4096]
-
blk.22.attn_v.weightQ6_K[4096 4096]
-
blk.22.attn_output.weightQ6_K[4096 4096]
-
blk.22.ffn_gate.weightQ6_K[4096 11008]
-
blk.22.ffn_up.weightQ6_K[4096 11008]
-
blk.22.ffn_down.weightQ6_K[11008 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.23.attn_q.weightQ6_K[4096 4096]
-
blk.23.attn_k.weightQ6_K[4096 4096]
-
blk.23.attn_v.weightQ6_K[4096 4096]
-
blk.23.attn_output.weightQ6_K[4096 4096]
-
blk.23.ffn_gate.weightQ6_K[4096 11008]
-
blk.23.ffn_up.weightQ6_K[4096 11008]
-
blk.23.ffn_down.weightQ6_K[11008 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.24.attn_q.weightQ6_K[4096 4096]
-
blk.24.attn_k.weightQ6_K[4096 4096]
-
blk.24.attn_v.weightQ6_K[4096 4096]
-
blk.24.attn_output.weightQ6_K[4096 4096]
-
blk.24.ffn_gate.weightQ6_K[4096 11008]
-
blk.24.ffn_up.weightQ6_K[4096 11008]
-
blk.24.ffn_down.weightQ6_K[11008 4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.25.attn_q.weightQ6_K[4096 4096]
-
blk.25.attn_k.weightQ6_K[4096 4096]
-
blk.25.attn_v.weightQ6_K[4096 4096]
-
blk.25.attn_output.weightQ6_K[4096 4096]
-
blk.25.ffn_gate.weightQ6_K[4096 11008]
-
blk.25.ffn_up.weightQ6_K[4096 11008]
-
blk.25.ffn_down.weightQ6_K[11008 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.26.attn_q.weightQ6_K[4096 4096]
-
blk.26.attn_k.weightQ6_K[4096 4096]
-
blk.26.attn_v.weightQ6_K[4096 4096]
-
blk.26.attn_output.weightQ6_K[4096 4096]
-
blk.26.ffn_gate.weightQ6_K[4096 11008]
-
blk.26.ffn_up.weightQ6_K[4096 11008]
-
blk.26.ffn_down.weightQ6_K[11008 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.27.attn_q.weightQ6_K[4096 4096]
-
blk.27.attn_k.weightQ6_K[4096 4096]
-
blk.27.attn_v.weightQ6_K[4096 4096]
-
blk.27.attn_output.weightQ6_K[4096 4096]
-
blk.27.ffn_gate.weightQ6_K[4096 11008]
-
blk.27.ffn_up.weightQ6_K[4096 11008]
-
blk.27.ffn_down.weightQ6_K[11008 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.28.attn_q.weightQ6_K[4096 4096]
-
blk.28.attn_k.weightQ6_K[4096 4096]
-
blk.28.attn_v.weightQ6_K[4096 4096]
-
blk.28.attn_output.weightQ6_K[4096 4096]
-
blk.28.ffn_gate.weightQ6_K[4096 11008]
-
blk.28.ffn_up.weightQ6_K[4096 11008]
-
blk.28.ffn_down.weightQ6_K[11008 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.29.attn_q.weightQ6_K[4096 4096]
-
blk.29.attn_k.weightQ6_K[4096 4096]
-
blk.29.attn_v.weightQ6_K[4096 4096]
-
blk.29.attn_output.weightQ6_K[4096 4096]
-
blk.29.ffn_gate.weightQ6_K[4096 11008]
-
blk.29.ffn_up.weightQ6_K[4096 11008]
-
blk.29.ffn_down.weightQ6_K[11008 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.30.attn_q.weightQ6_K[4096 4096]
-
blk.30.attn_k.weightQ6_K[4096 4096]
-
blk.30.attn_v.weightQ6_K[4096 4096]
-
blk.30.attn_output.weightQ6_K[4096 4096]
-
blk.30.ffn_gate.weightQ6_K[4096 11008]
-
blk.30.ffn_up.weightQ6_K[4096 11008]
-
blk.30.ffn_down.weightQ6_K[11008 4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.31.attn_q.weightQ6_K[4096 4096]
-
blk.31.attn_k.weightQ6_K[4096 4096]
-
blk.31.attn_v.weightQ6_K[4096 4096]
-
blk.31.attn_output.weightQ6_K[4096 4096]
-
blk.31.ffn_gate.weightQ6_K[4096 11008]
-
blk.31.ffn_up.weightQ6_K[4096 11008]
-
blk.31.ffn_down.weightQ6_K[11008 4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_norm.weightF32[4096]
-
output_norm.weightF32[4096]
-
output.weightQ6_K[4096 32001]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31