Derived from uukuguy/speechless-coder-ds-6.7b
7B
11 Pulls Updated 6 months ago
8131379b04d8 · 7.2GB
-
general.architecturellama
-
general.file_typeQ8_0
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count32
-
llama.context_length16384
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base100000
-
llama.rope.scaling.factor4
-
llama.rope.scaling.typelinear
-
tokenizer.ggml.bos_token_id32013
-
tokenizer.ggml.eos_token_id32014
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id32014
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ8_0[4096 32256]
-
blk.0.attn_q.weightQ8_0[4096 4096]
-
blk.0.attn_k.weightQ8_0[4096 4096]
-
blk.0.attn_v.weightQ8_0[4096 4096]
-
blk.0.attn_output.weightQ8_0[4096 4096]
-
blk.0.ffn_gate.weightQ8_0[4096 11008]
-
blk.0.ffn_up.weightQ8_0[4096 11008]
-
blk.0.ffn_down.weightQ8_0[11008 4096]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.1.attn_q.weightQ8_0[4096 4096]
-
blk.1.attn_k.weightQ8_0[4096 4096]
-
blk.1.attn_v.weightQ8_0[4096 4096]
-
blk.1.attn_output.weightQ8_0[4096 4096]
-
blk.1.ffn_gate.weightQ8_0[4096 11008]
-
blk.1.ffn_up.weightQ8_0[4096 11008]
-
blk.1.ffn_down.weightQ8_0[11008 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.2.attn_q.weightQ8_0[4096 4096]
-
blk.2.attn_k.weightQ8_0[4096 4096]
-
blk.2.attn_v.weightQ8_0[4096 4096]
-
blk.2.attn_output.weightQ8_0[4096 4096]
-
blk.2.ffn_gate.weightQ8_0[4096 11008]
-
blk.2.ffn_up.weightQ8_0[4096 11008]
-
blk.2.ffn_down.weightQ8_0[11008 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.3.attn_q.weightQ8_0[4096 4096]
-
blk.3.attn_k.weightQ8_0[4096 4096]
-
blk.3.attn_v.weightQ8_0[4096 4096]
-
blk.3.attn_output.weightQ8_0[4096 4096]
-
blk.3.ffn_gate.weightQ8_0[4096 11008]
-
blk.3.ffn_up.weightQ8_0[4096 11008]
-
blk.3.ffn_down.weightQ8_0[11008 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.4.attn_q.weightQ8_0[4096 4096]
-
blk.4.attn_k.weightQ8_0[4096 4096]
-
blk.4.attn_v.weightQ8_0[4096 4096]
-
blk.4.attn_output.weightQ8_0[4096 4096]
-
blk.4.ffn_gate.weightQ8_0[4096 11008]
-
blk.4.ffn_up.weightQ8_0[4096 11008]
-
blk.4.ffn_down.weightQ8_0[11008 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.5.attn_q.weightQ8_0[4096 4096]
-
blk.5.attn_k.weightQ8_0[4096 4096]
-
blk.5.attn_v.weightQ8_0[4096 4096]
-
blk.5.attn_output.weightQ8_0[4096 4096]
-
blk.5.ffn_gate.weightQ8_0[4096 11008]
-
blk.5.ffn_up.weightQ8_0[4096 11008]
-
blk.5.ffn_down.weightQ8_0[11008 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.6.attn_q.weightQ8_0[4096 4096]
-
blk.6.attn_k.weightQ8_0[4096 4096]
-
blk.6.attn_v.weightQ8_0[4096 4096]
-
blk.6.attn_output.weightQ8_0[4096 4096]
-
blk.6.ffn_gate.weightQ8_0[4096 11008]
-
blk.6.ffn_up.weightQ8_0[4096 11008]
-
blk.6.ffn_down.weightQ8_0[11008 4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.7.attn_q.weightQ8_0[4096 4096]
-
blk.7.attn_k.weightQ8_0[4096 4096]
-
blk.7.attn_v.weightQ8_0[4096 4096]
-
blk.7.attn_output.weightQ8_0[4096 4096]
-
blk.7.ffn_gate.weightQ8_0[4096 11008]
-
blk.7.ffn_up.weightQ8_0[4096 11008]
-
blk.7.ffn_down.weightQ8_0[11008 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.8.attn_q.weightQ8_0[4096 4096]
-
blk.8.attn_k.weightQ8_0[4096 4096]
-
blk.8.attn_v.weightQ8_0[4096 4096]
-
blk.8.attn_output.weightQ8_0[4096 4096]
-
blk.8.ffn_gate.weightQ8_0[4096 11008]
-
blk.8.ffn_up.weightQ8_0[4096 11008]
-
blk.8.ffn_down.weightQ8_0[11008 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.9.attn_q.weightQ8_0[4096 4096]
-
blk.9.attn_k.weightQ8_0[4096 4096]
-
blk.9.attn_v.weightQ8_0[4096 4096]
-
blk.9.attn_output.weightQ8_0[4096 4096]
-
blk.9.ffn_gate.weightQ8_0[4096 11008]
-
blk.9.ffn_up.weightQ8_0[4096 11008]
-
blk.9.ffn_down.weightQ8_0[11008 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.10.attn_q.weightQ8_0[4096 4096]
-
blk.10.attn_k.weightQ8_0[4096 4096]
-
blk.10.attn_v.weightQ8_0[4096 4096]
-
blk.10.attn_output.weightQ8_0[4096 4096]
-
blk.10.ffn_gate.weightQ8_0[4096 11008]
-
blk.10.ffn_up.weightQ8_0[4096 11008]
-
blk.10.ffn_down.weightQ8_0[11008 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.11.attn_q.weightQ8_0[4096 4096]
-
blk.11.attn_k.weightQ8_0[4096 4096]
-
blk.11.attn_v.weightQ8_0[4096 4096]
-
blk.11.attn_output.weightQ8_0[4096 4096]
-
blk.11.ffn_gate.weightQ8_0[4096 11008]
-
blk.11.ffn_up.weightQ8_0[4096 11008]
-
blk.11.ffn_down.weightQ8_0[11008 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.12.attn_q.weightQ8_0[4096 4096]
-
blk.12.attn_k.weightQ8_0[4096 4096]
-
blk.12.attn_v.weightQ8_0[4096 4096]
-
blk.12.attn_output.weightQ8_0[4096 4096]
-
blk.12.ffn_gate.weightQ8_0[4096 11008]
-
blk.12.ffn_up.weightQ8_0[4096 11008]
-
blk.12.ffn_down.weightQ8_0[11008 4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.13.attn_q.weightQ8_0[4096 4096]
-
blk.13.attn_k.weightQ8_0[4096 4096]
-
blk.13.attn_v.weightQ8_0[4096 4096]
-
blk.13.attn_output.weightQ8_0[4096 4096]
-
blk.13.ffn_gate.weightQ8_0[4096 11008]
-
blk.13.ffn_up.weightQ8_0[4096 11008]
-
blk.13.ffn_down.weightQ8_0[11008 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.14.attn_q.weightQ8_0[4096 4096]
-
blk.14.attn_k.weightQ8_0[4096 4096]
-
blk.14.attn_v.weightQ8_0[4096 4096]
-
blk.14.attn_output.weightQ8_0[4096 4096]
-
blk.14.ffn_gate.weightQ8_0[4096 11008]
-
blk.14.ffn_up.weightQ8_0[4096 11008]
-
blk.14.ffn_down.weightQ8_0[11008 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.15.attn_q.weightQ8_0[4096 4096]
-
blk.15.attn_k.weightQ8_0[4096 4096]
-
blk.15.attn_v.weightQ8_0[4096 4096]
-
blk.15.attn_output.weightQ8_0[4096 4096]
-
blk.15.ffn_gate.weightQ8_0[4096 11008]
-
blk.15.ffn_up.weightQ8_0[4096 11008]
-
blk.15.ffn_down.weightQ8_0[11008 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.16.attn_q.weightQ8_0[4096 4096]
-
blk.16.attn_k.weightQ8_0[4096 4096]
-
blk.16.attn_v.weightQ8_0[4096 4096]
-
blk.16.attn_output.weightQ8_0[4096 4096]
-
blk.16.ffn_gate.weightQ8_0[4096 11008]
-
blk.16.ffn_up.weightQ8_0[4096 11008]
-
blk.16.ffn_down.weightQ8_0[11008 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.17.attn_q.weightQ8_0[4096 4096]
-
blk.17.attn_k.weightQ8_0[4096 4096]
-
blk.17.attn_v.weightQ8_0[4096 4096]
-
blk.17.attn_output.weightQ8_0[4096 4096]
-
blk.17.ffn_gate.weightQ8_0[4096 11008]
-
blk.17.ffn_up.weightQ8_0[4096 11008]
-
blk.17.ffn_down.weightQ8_0[11008 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.18.attn_q.weightQ8_0[4096 4096]
-
blk.18.attn_k.weightQ8_0[4096 4096]
-
blk.18.attn_v.weightQ8_0[4096 4096]
-
blk.18.attn_output.weightQ8_0[4096 4096]
-
blk.18.ffn_gate.weightQ8_0[4096 11008]
-
blk.18.ffn_up.weightQ8_0[4096 11008]
-
blk.18.ffn_down.weightQ8_0[11008 4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.19.attn_q.weightQ8_0[4096 4096]
-
blk.19.attn_k.weightQ8_0[4096 4096]
-
blk.19.attn_v.weightQ8_0[4096 4096]
-
blk.19.attn_output.weightQ8_0[4096 4096]
-
blk.19.ffn_gate.weightQ8_0[4096 11008]
-
blk.19.ffn_up.weightQ8_0[4096 11008]
-
blk.19.ffn_down.weightQ8_0[11008 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.20.attn_q.weightQ8_0[4096 4096]
-
blk.20.attn_k.weightQ8_0[4096 4096]
-
blk.20.attn_v.weightQ8_0[4096 4096]
-
blk.20.attn_output.weightQ8_0[4096 4096]
-
blk.20.ffn_gate.weightQ8_0[4096 11008]
-
blk.20.ffn_up.weightQ8_0[4096 11008]
-
blk.20.ffn_down.weightQ8_0[11008 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.21.attn_q.weightQ8_0[4096 4096]
-
blk.21.attn_k.weightQ8_0[4096 4096]
-
blk.21.attn_v.weightQ8_0[4096 4096]
-
blk.21.attn_output.weightQ8_0[4096 4096]
-
blk.21.ffn_gate.weightQ8_0[4096 11008]
-
blk.21.ffn_up.weightQ8_0[4096 11008]
-
blk.21.ffn_down.weightQ8_0[11008 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.22.attn_q.weightQ8_0[4096 4096]
-
blk.22.attn_k.weightQ8_0[4096 4096]
-
blk.22.attn_v.weightQ8_0[4096 4096]
-
blk.22.attn_output.weightQ8_0[4096 4096]
-
blk.22.ffn_gate.weightQ8_0[4096 11008]
-
blk.22.ffn_up.weightQ8_0[4096 11008]
-
blk.22.ffn_down.weightQ8_0[11008 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.23.attn_q.weightQ8_0[4096 4096]
-
blk.23.attn_k.weightQ8_0[4096 4096]
-
blk.23.attn_v.weightQ8_0[4096 4096]
-
blk.23.attn_output.weightQ8_0[4096 4096]
-
blk.23.ffn_gate.weightQ8_0[4096 11008]
-
blk.23.ffn_up.weightQ8_0[4096 11008]
-
blk.23.ffn_down.weightQ8_0[11008 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.24.attn_q.weightQ8_0[4096 4096]
-
blk.24.attn_k.weightQ8_0[4096 4096]
-
blk.24.attn_v.weightQ8_0[4096 4096]
-
blk.24.attn_output.weightQ8_0[4096 4096]
-
blk.24.ffn_gate.weightQ8_0[4096 11008]
-
blk.24.ffn_up.weightQ8_0[4096 11008]
-
blk.24.ffn_down.weightQ8_0[11008 4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.25.attn_q.weightQ8_0[4096 4096]
-
blk.25.attn_k.weightQ8_0[4096 4096]
-
blk.25.attn_v.weightQ8_0[4096 4096]
-
blk.25.attn_output.weightQ8_0[4096 4096]
-
blk.25.ffn_gate.weightQ8_0[4096 11008]
-
blk.25.ffn_up.weightQ8_0[4096 11008]
-
blk.25.ffn_down.weightQ8_0[11008 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.26.attn_q.weightQ8_0[4096 4096]
-
blk.26.attn_k.weightQ8_0[4096 4096]
-
blk.26.attn_v.weightQ8_0[4096 4096]
-
blk.26.attn_output.weightQ8_0[4096 4096]
-
blk.26.ffn_gate.weightQ8_0[4096 11008]
-
blk.26.ffn_up.weightQ8_0[4096 11008]
-
blk.26.ffn_down.weightQ8_0[11008 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.27.attn_q.weightQ8_0[4096 4096]
-
blk.27.attn_k.weightQ8_0[4096 4096]
-
blk.27.attn_v.weightQ8_0[4096 4096]
-
blk.27.attn_output.weightQ8_0[4096 4096]
-
blk.27.ffn_gate.weightQ8_0[4096 11008]
-
blk.27.ffn_up.weightQ8_0[4096 11008]
-
blk.27.ffn_down.weightQ8_0[11008 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.28.attn_q.weightQ8_0[4096 4096]
-
blk.28.attn_k.weightQ8_0[4096 4096]
-
blk.28.attn_v.weightQ8_0[4096 4096]
-
blk.28.attn_output.weightQ8_0[4096 4096]
-
blk.28.ffn_gate.weightQ8_0[4096 11008]
-
blk.28.ffn_up.weightQ8_0[4096 11008]
-
blk.28.ffn_down.weightQ8_0[11008 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.29.attn_q.weightQ8_0[4096 4096]
-
blk.29.attn_k.weightQ8_0[4096 4096]
-
blk.29.attn_v.weightQ8_0[4096 4096]
-
blk.29.attn_output.weightQ8_0[4096 4096]
-
blk.29.ffn_gate.weightQ8_0[4096 11008]
-
blk.29.ffn_up.weightQ8_0[4096 11008]
-
blk.29.ffn_down.weightQ8_0[11008 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.30.attn_q.weightQ8_0[4096 4096]
-
blk.30.attn_k.weightQ8_0[4096 4096]
-
blk.30.attn_v.weightQ8_0[4096 4096]
-
blk.30.attn_output.weightQ8_0[4096 4096]
-
blk.30.ffn_gate.weightQ8_0[4096 11008]
-
blk.30.ffn_up.weightQ8_0[4096 11008]
-
blk.30.ffn_down.weightQ8_0[11008 4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.31.attn_q.weightQ8_0[4096 4096]
-
blk.31.attn_k.weightQ8_0[4096 4096]
-
blk.31.attn_v.weightQ8_0[4096 4096]
-
blk.31.attn_output.weightQ8_0[4096 4096]
-
blk.31.ffn_gate.weightQ8_0[4096 11008]
-
blk.31.ffn_up.weightQ8_0[4096 11008]
-
blk.31.ffn_down.weightQ8_0[11008 4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_norm.weightF32[4096]
-
output_norm.weightF32[4096]
-
output.weightQ8_0[4096 32256]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31