7 Pulls Updated 9 days ago
1e0621ec3bf9 · 28GB
-
general.architecturellama
-
general.file_typeF16
-
llama.attention.head_count40
-
llama.attention.head_count_kv10
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count40
-
llama.context_length4096
-
llama.embedding_length5120
-
llama.feed_forward_length17920
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
llama.vocab_size32064
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32009
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 4 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightF16[5120 32064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightF16[17920 5120]
-
blk.0.ffn_gate.weightF16[5120 17920]
-
blk.0.ffn_up.weightF16[5120 17920]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.weightF16[5120 1280]
-
blk.0.attn_output.weightF16[5120 5120]
-
blk.0.attn_q.weightF16[5120 5120]
-
blk.0.attn_v.weightF16[5120 1280]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightF16[17920 5120]
-
blk.1.ffn_gate.weightF16[5120 17920]
-
blk.1.ffn_up.weightF16[5120 17920]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.weightF16[5120 1280]
-
blk.1.attn_output.weightF16[5120 5120]
-
blk.1.attn_q.weightF16[5120 5120]
-
blk.1.attn_v.weightF16[5120 1280]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightF16[17920 5120]
-
blk.2.ffn_gate.weightF16[5120 17920]
-
blk.2.ffn_up.weightF16[5120 17920]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.weightF16[5120 1280]
-
blk.2.attn_output.weightF16[5120 5120]
-
blk.2.attn_q.weightF16[5120 5120]
-
blk.2.attn_v.weightF16[5120 1280]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightF16[17920 5120]
-
blk.3.ffn_gate.weightF16[5120 17920]
-
blk.3.ffn_up.weightF16[5120 17920]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.weightF16[5120 1280]
-
blk.3.attn_output.weightF16[5120 5120]
-
blk.3.attn_q.weightF16[5120 5120]
-
blk.3.attn_v.weightF16[5120 1280]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightF16[17920 5120]
-
blk.4.ffn_gate.weightF16[5120 17920]
-
blk.4.ffn_up.weightF16[5120 17920]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.weightF16[5120 1280]
-
blk.4.attn_output.weightF16[5120 5120]
-
blk.4.attn_q.weightF16[5120 5120]
-
blk.4.attn_v.weightF16[5120 1280]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightF16[17920 5120]
-
blk.5.ffn_gate.weightF16[5120 17920]
-
blk.5.ffn_up.weightF16[5120 17920]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.weightF16[5120 1280]
-
blk.5.attn_output.weightF16[5120 5120]
-
blk.5.attn_q.weightF16[5120 5120]
-
blk.5.attn_v.weightF16[5120 1280]
-
blk.6.ffn_gate.weightF16[5120 17920]
-
blk.6.ffn_up.weightF16[5120 17920]
-
blk.6.attn_k.weightF16[5120 1280]
-
blk.6.attn_output.weightF16[5120 5120]
-
blk.6.attn_q.weightF16[5120 5120]
-
blk.6.attn_v.weightF16[5120 1280]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightF16[17920 5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightF16[17920 5120]
-
blk.7.ffn_gate.weightF16[5120 17920]
-
blk.7.ffn_up.weightF16[5120 17920]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.weightF16[5120 1280]
-
blk.7.attn_output.weightF16[5120 5120]
-
blk.7.attn_q.weightF16[5120 5120]
-
blk.7.attn_v.weightF16[5120 1280]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightF16[17920 5120]
-
blk.8.ffn_gate.weightF16[5120 17920]
-
blk.8.ffn_up.weightF16[5120 17920]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.weightF16[5120 1280]
-
blk.8.attn_output.weightF16[5120 5120]
-
blk.8.attn_q.weightF16[5120 5120]
-
blk.8.attn_v.weightF16[5120 1280]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightF16[17920 5120]
-
blk.9.ffn_gate.weightF16[5120 17920]
-
blk.9.ffn_up.weightF16[5120 17920]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.weightF16[5120 1280]
-
blk.9.attn_output.weightF16[5120 5120]
-
blk.9.attn_q.weightF16[5120 5120]
-
blk.9.attn_v.weightF16[5120 1280]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightF16[17920 5120]
-
blk.10.ffn_gate.weightF16[5120 17920]
-
blk.10.ffn_up.weightF16[5120 17920]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.weightF16[5120 1280]
-
blk.10.attn_output.weightF16[5120 5120]
-
blk.10.attn_q.weightF16[5120 5120]
-
blk.10.attn_v.weightF16[5120 1280]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightF16[17920 5120]
-
blk.11.ffn_gate.weightF16[5120 17920]
-
blk.11.ffn_up.weightF16[5120 17920]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.weightF16[5120 1280]
-
blk.11.attn_output.weightF16[5120 5120]
-
blk.11.attn_q.weightF16[5120 5120]
-
blk.11.attn_v.weightF16[5120 1280]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightF16[17920 5120]
-
blk.12.ffn_gate.weightF16[5120 17920]
-
blk.12.ffn_up.weightF16[5120 17920]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.weightF16[5120 1280]
-
blk.12.attn_output.weightF16[5120 5120]
-
blk.12.attn_q.weightF16[5120 5120]
-
blk.12.attn_v.weightF16[5120 1280]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightF16[17920 5120]
-
blk.13.ffn_gate.weightF16[5120 17920]
-
blk.13.ffn_up.weightF16[5120 17920]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.weightF16[5120 1280]
-
blk.13.attn_output.weightF16[5120 5120]
-
blk.13.attn_q.weightF16[5120 5120]
-
blk.13.attn_v.weightF16[5120 1280]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightF16[17920 5120]
-
blk.14.ffn_gate.weightF16[5120 17920]
-
blk.14.ffn_up.weightF16[5120 17920]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.weightF16[5120 1280]
-
blk.14.attn_output.weightF16[5120 5120]
-
blk.14.attn_q.weightF16[5120 5120]
-
blk.14.attn_v.weightF16[5120 1280]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightF16[17920 5120]
-
blk.15.ffn_gate.weightF16[5120 17920]
-
blk.15.ffn_up.weightF16[5120 17920]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.weightF16[5120 1280]
-
blk.15.attn_output.weightF16[5120 5120]
-
blk.15.attn_q.weightF16[5120 5120]
-
blk.15.attn_v.weightF16[5120 1280]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightF16[17920 5120]
-
blk.16.ffn_gate.weightF16[5120 17920]
-
blk.16.ffn_up.weightF16[5120 17920]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.weightF16[5120 1280]
-
blk.16.attn_output.weightF16[5120 5120]
-
blk.16.attn_q.weightF16[5120 5120]
-
blk.16.attn_v.weightF16[5120 1280]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightF16[17920 5120]
-
blk.17.ffn_gate.weightF16[5120 17920]
-
blk.17.ffn_up.weightF16[5120 17920]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.weightF16[5120 1280]
-
blk.17.attn_output.weightF16[5120 5120]
-
blk.17.attn_q.weightF16[5120 5120]
-
blk.17.attn_v.weightF16[5120 1280]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightF16[17920 5120]
-
blk.18.ffn_gate.weightF16[5120 17920]
-
blk.18.ffn_up.weightF16[5120 17920]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.weightF16[5120 1280]
-
blk.18.attn_output.weightF16[5120 5120]
-
blk.18.attn_q.weightF16[5120 5120]
-
blk.18.attn_v.weightF16[5120 1280]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightF16[17920 5120]
-
blk.19.ffn_gate.weightF16[5120 17920]
-
blk.19.ffn_up.weightF16[5120 17920]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.weightF16[5120 1280]
-
blk.19.attn_output.weightF16[5120 5120]
-
blk.19.attn_q.weightF16[5120 5120]
-
blk.19.attn_v.weightF16[5120 1280]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightF16[17920 5120]
-
blk.20.ffn_gate.weightF16[5120 17920]
-
blk.20.ffn_up.weightF16[5120 17920]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.weightF16[5120 1280]
-
blk.20.attn_output.weightF16[5120 5120]
-
blk.20.attn_q.weightF16[5120 5120]
-
blk.20.attn_v.weightF16[5120 1280]
-
blk.21.attn_k.weightF16[5120 1280]
-
blk.21.attn_output.weightF16[5120 5120]
-
blk.21.attn_q.weightF16[5120 5120]
-
blk.21.attn_v.weightF16[5120 1280]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightF16[17920 5120]
-
blk.21.ffn_gate.weightF16[5120 17920]
-
blk.21.ffn_up.weightF16[5120 17920]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightF16[17920 5120]
-
blk.22.ffn_gate.weightF16[5120 17920]
-
blk.22.ffn_up.weightF16[5120 17920]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.weightF16[5120 1280]
-
blk.22.attn_output.weightF16[5120 5120]
-
blk.22.attn_q.weightF16[5120 5120]
-
blk.22.attn_v.weightF16[5120 1280]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightF16[17920 5120]
-
blk.23.ffn_gate.weightF16[5120 17920]
-
blk.23.ffn_up.weightF16[5120 17920]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.weightF16[5120 1280]
-
blk.23.attn_output.weightF16[5120 5120]
-
blk.23.attn_q.weightF16[5120 5120]
-
blk.23.attn_v.weightF16[5120 1280]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightF16[17920 5120]
-
blk.24.ffn_gate.weightF16[5120 17920]
-
blk.24.ffn_up.weightF16[5120 17920]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.weightF16[5120 1280]
-
blk.24.attn_output.weightF16[5120 5120]
-
blk.24.attn_q.weightF16[5120 5120]
-
blk.24.attn_v.weightF16[5120 1280]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightF16[17920 5120]
-
blk.25.ffn_gate.weightF16[5120 17920]
-
blk.25.ffn_up.weightF16[5120 17920]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.weightF16[5120 1280]
-
blk.25.attn_output.weightF16[5120 5120]
-
blk.25.attn_q.weightF16[5120 5120]
-
blk.25.attn_v.weightF16[5120 1280]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightF16[17920 5120]
-
blk.26.ffn_gate.weightF16[5120 17920]
-
blk.26.ffn_up.weightF16[5120 17920]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.weightF16[5120 1280]
-
blk.26.attn_output.weightF16[5120 5120]
-
blk.26.attn_q.weightF16[5120 5120]
-
blk.26.attn_v.weightF16[5120 1280]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightF16[17920 5120]
-
blk.27.ffn_gate.weightF16[5120 17920]
-
blk.27.ffn_up.weightF16[5120 17920]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.weightF16[5120 1280]
-
blk.27.attn_output.weightF16[5120 5120]
-
blk.27.attn_q.weightF16[5120 5120]
-
blk.27.attn_v.weightF16[5120 1280]
-
blk.28.ffn_gate.weightF16[5120 17920]
-
blk.28.attn_k.weightF16[5120 1280]
-
blk.28.attn_output.weightF16[5120 5120]
-
blk.28.attn_q.weightF16[5120 5120]
-
blk.28.attn_v.weightF16[5120 1280]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightF16[17920 5120]
-
blk.28.ffn_up.weightF16[5120 17920]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightF16[17920 5120]
-
blk.29.ffn_gate.weightF16[5120 17920]
-
blk.29.ffn_up.weightF16[5120 17920]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.weightF16[5120 1280]
-
blk.29.attn_output.weightF16[5120 5120]
-
blk.29.attn_q.weightF16[5120 5120]
-
blk.29.attn_v.weightF16[5120 1280]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightF16[17920 5120]
-
blk.30.ffn_gate.weightF16[5120 17920]
-
blk.30.ffn_up.weightF16[5120 17920]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.weightF16[5120 1280]
-
blk.30.attn_output.weightF16[5120 5120]
-
blk.30.attn_q.weightF16[5120 5120]
-
blk.30.attn_v.weightF16[5120 1280]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightF16[17920 5120]
-
blk.31.ffn_gate.weightF16[5120 17920]
-
blk.31.ffn_up.weightF16[5120 17920]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.weightF16[5120 1280]
-
blk.31.attn_output.weightF16[5120 5120]
-
blk.31.attn_q.weightF16[5120 5120]
-
blk.31.attn_v.weightF16[5120 1280]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightF16[17920 5120]
-
blk.32.ffn_gate.weightF16[5120 17920]
-
blk.32.ffn_up.weightF16[5120 17920]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.weightF16[5120 1280]
-
blk.32.attn_output.weightF16[5120 5120]
-
blk.32.attn_q.weightF16[5120 5120]
-
blk.32.attn_v.weightF16[5120 1280]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightF16[17920 5120]
-
blk.33.ffn_gate.weightF16[5120 17920]
-
blk.33.ffn_up.weightF16[5120 17920]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.weightF16[5120 1280]
-
blk.33.attn_output.weightF16[5120 5120]
-
blk.33.attn_q.weightF16[5120 5120]
-
blk.33.attn_v.weightF16[5120 1280]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightF16[17920 5120]
-
blk.34.ffn_gate.weightF16[5120 17920]
-
blk.34.ffn_up.weightF16[5120 17920]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.weightF16[5120 1280]
-
blk.34.attn_output.weightF16[5120 5120]
-
blk.34.attn_q.weightF16[5120 5120]
-
blk.34.attn_v.weightF16[5120 1280]
-
blk.35.ffn_gate.weightF16[5120 17920]
-
blk.35.ffn_up.weightF16[5120 17920]
-
blk.35.attn_k.weightF16[5120 1280]
-
blk.35.attn_output.weightF16[5120 5120]
-
blk.35.attn_q.weightF16[5120 5120]
-
blk.35.attn_v.weightF16[5120 1280]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightF16[17920 5120]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightF16[17920 5120]
-
blk.36.ffn_gate.weightF16[5120 17920]
-
blk.36.ffn_up.weightF16[5120 17920]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.weightF16[5120 1280]
-
blk.36.attn_output.weightF16[5120 5120]
-
blk.36.attn_q.weightF16[5120 5120]
-
blk.36.attn_v.weightF16[5120 1280]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightF16[17920 5120]
-
blk.37.ffn_gate.weightF16[5120 17920]
-
blk.37.ffn_up.weightF16[5120 17920]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.weightF16[5120 1280]
-
blk.37.attn_output.weightF16[5120 5120]
-
blk.37.attn_q.weightF16[5120 5120]
-
blk.37.attn_v.weightF16[5120 1280]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightF16[17920 5120]
-
blk.38.ffn_gate.weightF16[5120 17920]
-
blk.38.ffn_up.weightF16[5120 17920]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.weightF16[5120 1280]
-
blk.38.attn_output.weightF16[5120 5120]
-
blk.38.attn_q.weightF16[5120 5120]
-
blk.38.attn_v.weightF16[5120 1280]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightF16[17920 5120]
-
blk.39.ffn_gate.weightF16[5120 17920]
-
blk.39.ffn_up.weightF16[5120 17920]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.weightF16[5120 1280]
-
blk.39.attn_output.weightF16[5120 5120]
-
blk.39.attn_q.weightF16[5120 5120]
-
blk.39.attn_v.weightF16[5120 1280]
-
output.weightF16[5120 32064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39