7B
28 Pulls Updated 5 months ago
dbe8bd6a4b45 · 5.5GB
-
general.architecturellama
-
general.file_typeQ6_K
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count32
-
llama.context_length16384
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base100000
-
llama.rope.scaling.factor4
-
llama.rope.scaling.typelinear
-
tokenizer.ggml.bos_token_id32013
-
tokenizer.ggml.eos_token_id32021
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id32014
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ6_K[4096 32256]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ6_K[11008 4096]
-
blk.0.ffn_gate.weightQ6_K[4096 11008]
-
blk.0.ffn_up.weightQ6_K[4096 11008]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weightQ6_K[4096 4096]
-
blk.0.attn_output.weightQ6_K[4096 4096]
-
blk.0.attn_q.weightQ6_K[4096 4096]
-
blk.0.attn_v.weightQ6_K[4096 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ6_K[11008 4096]
-
blk.1.ffn_gate.weightQ6_K[4096 11008]
-
blk.1.ffn_up.weightQ6_K[4096 11008]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weightQ6_K[4096 4096]
-
blk.1.attn_output.weightQ6_K[4096 4096]
-
blk.1.attn_q.weightQ6_K[4096 4096]
-
blk.1.attn_v.weightQ6_K[4096 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightQ6_K[11008 4096]
-
blk.2.ffn_gate.weightQ6_K[4096 11008]
-
blk.2.ffn_up.weightQ6_K[4096 11008]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weightQ6_K[4096 4096]
-
blk.2.attn_output.weightQ6_K[4096 4096]
-
blk.2.attn_q.weightQ6_K[4096 4096]
-
blk.2.attn_v.weightQ6_K[4096 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightQ6_K[11008 4096]
-
blk.3.ffn_gate.weightQ6_K[4096 11008]
-
blk.3.ffn_up.weightQ6_K[4096 11008]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weightQ6_K[4096 4096]
-
blk.3.attn_output.weightQ6_K[4096 4096]
-
blk.3.attn_q.weightQ6_K[4096 4096]
-
blk.3.attn_v.weightQ6_K[4096 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightQ6_K[11008 4096]
-
blk.4.ffn_gate.weightQ6_K[4096 11008]
-
blk.4.ffn_up.weightQ6_K[4096 11008]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weightQ6_K[4096 4096]
-
blk.4.attn_output.weightQ6_K[4096 4096]
-
blk.4.attn_q.weightQ6_K[4096 4096]
-
blk.4.attn_v.weightQ6_K[4096 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightQ6_K[11008 4096]
-
blk.5.ffn_gate.weightQ6_K[4096 11008]
-
blk.5.ffn_up.weightQ6_K[4096 11008]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.attn_k.weightQ6_K[4096 4096]
-
blk.5.attn_output.weightQ6_K[4096 4096]
-
blk.5.attn_q.weightQ6_K[4096 4096]
-
blk.5.attn_v.weightQ6_K[4096 4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weightQ6_K[11008 4096]
-
blk.6.ffn_gate.weightQ6_K[4096 11008]
-
blk.6.ffn_up.weightQ6_K[4096 11008]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weightQ6_K[4096 4096]
-
blk.6.attn_output.weightQ6_K[4096 4096]
-
blk.6.attn_q.weightQ6_K[4096 4096]
-
blk.6.attn_v.weightQ6_K[4096 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weightQ6_K[11008 4096]
-
blk.7.ffn_gate.weightQ6_K[4096 11008]
-
blk.7.ffn_up.weightQ6_K[4096 11008]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weightQ6_K[4096 4096]
-
blk.7.attn_output.weightQ6_K[4096 4096]
-
blk.7.attn_q.weightQ6_K[4096 4096]
-
blk.7.attn_v.weightQ6_K[4096 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weightQ6_K[11008 4096]
-
blk.8.ffn_gate.weightQ6_K[4096 11008]
-
blk.8.ffn_up.weightQ6_K[4096 11008]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weightQ6_K[4096 4096]
-
blk.8.attn_output.weightQ6_K[4096 4096]
-
blk.8.attn_q.weightQ6_K[4096 4096]
-
blk.8.attn_v.weightQ6_K[4096 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weightQ6_K[11008 4096]
-
blk.9.ffn_gate.weightQ6_K[4096 11008]
-
blk.9.ffn_up.weightQ6_K[4096 11008]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weightQ6_K[4096 4096]
-
blk.9.attn_output.weightQ6_K[4096 4096]
-
blk.9.attn_q.weightQ6_K[4096 4096]
-
blk.9.attn_v.weightQ6_K[4096 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightQ6_K[11008 4096]
-
blk.10.ffn_gate.weightQ6_K[4096 11008]
-
blk.10.ffn_up.weightQ6_K[4096 11008]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.attn_k.weightQ6_K[4096 4096]
-
blk.10.attn_output.weightQ6_K[4096 4096]
-
blk.10.attn_q.weightQ6_K[4096 4096]
-
blk.10.attn_v.weightQ6_K[4096 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightQ6_K[11008 4096]
-
blk.11.ffn_gate.weightQ6_K[4096 11008]
-
blk.11.ffn_up.weightQ6_K[4096 11008]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.attn_k.weightQ6_K[4096 4096]
-
blk.11.attn_output.weightQ6_K[4096 4096]
-
blk.11.attn_q.weightQ6_K[4096 4096]
-
blk.11.attn_v.weightQ6_K[4096 4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightQ6_K[11008 4096]
-
blk.12.ffn_gate.weightQ6_K[4096 11008]
-
blk.12.ffn_up.weightQ6_K[4096 11008]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.attn_k.weightQ6_K[4096 4096]
-
blk.12.attn_output.weightQ6_K[4096 4096]
-
blk.12.attn_q.weightQ6_K[4096 4096]
-
blk.12.attn_v.weightQ6_K[4096 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightQ6_K[11008 4096]
-
blk.13.ffn_gate.weightQ6_K[4096 11008]
-
blk.13.ffn_up.weightQ6_K[4096 11008]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weightQ6_K[4096 4096]
-
blk.13.attn_output.weightQ6_K[4096 4096]
-
blk.13.attn_q.weightQ6_K[4096 4096]
-
blk.13.attn_v.weightQ6_K[4096 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weightQ6_K[11008 4096]
-
blk.14.ffn_gate.weightQ6_K[4096 11008]
-
blk.14.ffn_up.weightQ6_K[4096 11008]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weightQ6_K[4096 4096]
-
blk.14.attn_output.weightQ6_K[4096 4096]
-
blk.14.attn_q.weightQ6_K[4096 4096]
-
blk.14.attn_v.weightQ6_K[4096 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weightQ6_K[11008 4096]
-
blk.15.ffn_gate.weightQ6_K[4096 11008]
-
blk.15.ffn_up.weightQ6_K[4096 11008]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weightQ6_K[4096 4096]
-
blk.15.attn_output.weightQ6_K[4096 4096]
-
blk.15.attn_q.weightQ6_K[4096 4096]
-
blk.15.attn_v.weightQ6_K[4096 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weightQ6_K[11008 4096]
-
blk.16.ffn_gate.weightQ6_K[4096 11008]
-
blk.16.ffn_up.weightQ6_K[4096 11008]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weightQ6_K[4096 4096]
-
blk.16.attn_output.weightQ6_K[4096 4096]
-
blk.16.attn_q.weightQ6_K[4096 4096]
-
blk.16.attn_v.weightQ6_K[4096 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weightQ6_K[11008 4096]
-
blk.17.ffn_gate.weightQ6_K[4096 11008]
-
blk.17.ffn_up.weightQ6_K[4096 11008]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.attn_k.weightQ6_K[4096 4096]
-
blk.17.attn_output.weightQ6_K[4096 4096]
-
blk.17.attn_q.weightQ6_K[4096 4096]
-
blk.17.attn_v.weightQ6_K[4096 4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weightQ6_K[11008 4096]
-
blk.18.ffn_gate.weightQ6_K[4096 11008]
-
blk.18.ffn_up.weightQ6_K[4096 11008]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weightQ6_K[4096 4096]
-
blk.18.attn_output.weightQ6_K[4096 4096]
-
blk.18.attn_q.weightQ6_K[4096 4096]
-
blk.18.attn_v.weightQ6_K[4096 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weightQ6_K[11008 4096]
-
blk.19.ffn_gate.weightQ6_K[4096 11008]
-
blk.19.ffn_up.weightQ6_K[4096 11008]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weightQ6_K[4096 4096]
-
blk.19.attn_output.weightQ6_K[4096 4096]
-
blk.19.attn_q.weightQ6_K[4096 4096]
-
blk.19.attn_v.weightQ6_K[4096 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weightQ6_K[11008 4096]
-
blk.20.ffn_gate.weightQ6_K[4096 11008]
-
blk.20.ffn_up.weightQ6_K[4096 11008]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weightQ6_K[4096 4096]
-
blk.20.attn_output.weightQ6_K[4096 4096]
-
blk.20.attn_q.weightQ6_K[4096 4096]
-
blk.20.attn_v.weightQ6_K[4096 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weightQ6_K[11008 4096]
-
blk.21.ffn_gate.weightQ6_K[4096 11008]
-
blk.21.ffn_up.weightQ6_K[4096 11008]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weightQ6_K[4096 4096]
-
blk.21.attn_output.weightQ6_K[4096 4096]
-
blk.21.attn_q.weightQ6_K[4096 4096]
-
blk.21.attn_v.weightQ6_K[4096 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weightQ6_K[11008 4096]
-
blk.22.ffn_gate.weightQ6_K[4096 11008]
-
blk.22.ffn_up.weightQ6_K[4096 11008]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.attn_k.weightQ6_K[4096 4096]
-
blk.22.attn_output.weightQ6_K[4096 4096]
-
blk.22.attn_q.weightQ6_K[4096 4096]
-
blk.22.attn_v.weightQ6_K[4096 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weightQ6_K[11008 4096]
-
blk.23.ffn_gate.weightQ6_K[4096 11008]
-
blk.23.ffn_up.weightQ6_K[4096 11008]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.attn_k.weightQ6_K[4096 4096]
-
blk.23.attn_output.weightQ6_K[4096 4096]
-
blk.23.attn_q.weightQ6_K[4096 4096]
-
blk.23.attn_v.weightQ6_K[4096 4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weightQ6_K[11008 4096]
-
blk.24.ffn_gate.weightQ6_K[4096 11008]
-
blk.24.ffn_up.weightQ6_K[4096 11008]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weightQ6_K[4096 4096]
-
blk.24.attn_output.weightQ6_K[4096 4096]
-
blk.24.attn_q.weightQ6_K[4096 4096]
-
blk.24.attn_v.weightQ6_K[4096 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weightQ6_K[11008 4096]
-
blk.25.ffn_gate.weightQ6_K[4096 11008]
-
blk.25.ffn_up.weightQ6_K[4096 11008]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weightQ6_K[4096 4096]
-
blk.25.attn_output.weightQ6_K[4096 4096]
-
blk.25.attn_q.weightQ6_K[4096 4096]
-
blk.25.attn_v.weightQ6_K[4096 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weightQ6_K[11008 4096]
-
blk.26.ffn_gate.weightQ6_K[4096 11008]
-
blk.26.ffn_up.weightQ6_K[4096 11008]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weightQ6_K[4096 4096]
-
blk.26.attn_output.weightQ6_K[4096 4096]
-
blk.26.attn_q.weightQ6_K[4096 4096]
-
blk.26.attn_v.weightQ6_K[4096 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weightQ6_K[11008 4096]
-
blk.27.ffn_gate.weightQ6_K[4096 11008]
-
blk.27.ffn_up.weightQ6_K[4096 11008]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_k.weightQ6_K[4096 4096]
-
blk.27.attn_output.weightQ6_K[4096 4096]
-
blk.27.attn_q.weightQ6_K[4096 4096]
-
blk.27.attn_v.weightQ6_K[4096 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weightQ6_K[11008 4096]
-
blk.28.ffn_gate.weightQ6_K[4096 11008]
-
blk.28.ffn_up.weightQ6_K[4096 11008]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weightQ6_K[4096 4096]
-
blk.28.attn_output.weightQ6_K[4096 4096]
-
blk.28.attn_q.weightQ6_K[4096 4096]
-
blk.28.attn_v.weightQ6_K[4096 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weightQ6_K[11008 4096]
-
blk.29.ffn_gate.weightQ6_K[4096 11008]
-
blk.29.ffn_up.weightQ6_K[4096 11008]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.attn_k.weightQ6_K[4096 4096]
-
blk.29.attn_output.weightQ6_K[4096 4096]
-
blk.29.attn_q.weightQ6_K[4096 4096]
-
blk.29.attn_v.weightQ6_K[4096 4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weightQ6_K[11008 4096]
-
blk.30.ffn_gate.weightQ6_K[4096 11008]
-
blk.30.ffn_up.weightQ6_K[4096 11008]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weightQ6_K[4096 4096]
-
blk.30.attn_output.weightQ6_K[4096 4096]
-
blk.30.attn_q.weightQ6_K[4096 4096]
-
blk.30.attn_v.weightQ6_K[4096 4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weightQ6_K[11008 4096]
-
blk.31.ffn_gate.weightQ6_K[4096 11008]
-
blk.31.ffn_up.weightQ6_K[4096 11008]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weightQ6_K[4096 4096]
-
blk.31.attn_output.weightQ6_K[4096 4096]
-
blk.31.attn_q.weightQ6_K[4096 4096]
-
blk.31.attn_v.weightQ6_K[4096 4096]
-
output.weightQ6_K[4096 32256]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31