Code
9B
1 Pull Updated 4 days ago
76f9fda937a5 · 9.4GB
-
general.architecturellama
-
general.file_typeQ8_0
-
llama.attention.head_count32
-
llama.attention.head_count_kv4
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count48
-
llama.context_length131072
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+07
-
llama.vocab_size64000
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <|startoftext|> <|endoftext|> <|Human|> <|Assistant|> ...]
-
NameTypeShape
-
token_embd.weightQ8_0[4096 64000]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ8_0[11008 4096]
-
blk.0.ffn_gate.weightQ8_0[4096 11008]
-
blk.0.ffn_up.weightQ8_0[4096 11008]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weightQ8_0[4096 512]
-
blk.0.attn_output.weightQ8_0[4096 4096]
-
blk.0.attn_q.weightQ8_0[4096 4096]
-
blk.0.attn_v.weightQ8_0[4096 512]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ8_0[11008 4096]
-
blk.1.ffn_gate.weightQ8_0[4096 11008]
-
blk.1.ffn_up.weightQ8_0[4096 11008]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weightQ8_0[4096 512]
-
blk.1.attn_output.weightQ8_0[4096 4096]
-
blk.1.attn_q.weightQ8_0[4096 4096]
-
blk.1.attn_v.weightQ8_0[4096 512]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightQ8_0[11008 4096]
-
blk.2.ffn_gate.weightQ8_0[4096 11008]
-
blk.2.ffn_up.weightQ8_0[4096 11008]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weightQ8_0[4096 512]
-
blk.2.attn_output.weightQ8_0[4096 4096]
-
blk.2.attn_q.weightQ8_0[4096 4096]
-
blk.2.attn_v.weightQ8_0[4096 512]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightQ8_0[11008 4096]
-
blk.3.ffn_gate.weightQ8_0[4096 11008]
-
blk.3.ffn_up.weightQ8_0[4096 11008]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weightQ8_0[4096 512]
-
blk.3.attn_output.weightQ8_0[4096 4096]
-
blk.3.attn_q.weightQ8_0[4096 4096]
-
blk.3.attn_v.weightQ8_0[4096 512]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightQ8_0[11008 4096]
-
blk.4.ffn_gate.weightQ8_0[4096 11008]
-
blk.4.ffn_up.weightQ8_0[4096 11008]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weightQ8_0[4096 512]
-
blk.4.attn_output.weightQ8_0[4096 4096]
-
blk.4.attn_q.weightQ8_0[4096 4096]
-
blk.4.attn_v.weightQ8_0[4096 512]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightQ8_0[11008 4096]
-
blk.5.ffn_gate.weightQ8_0[4096 11008]
-
blk.5.ffn_up.weightQ8_0[4096 11008]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.attn_k.weightQ8_0[4096 512]
-
blk.5.attn_output.weightQ8_0[4096 4096]
-
blk.5.attn_q.weightQ8_0[4096 4096]
-
blk.5.attn_v.weightQ8_0[4096 512]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weightQ8_0[11008 4096]
-
blk.6.ffn_gate.weightQ8_0[4096 11008]
-
blk.6.ffn_up.weightQ8_0[4096 11008]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weightQ8_0[4096 512]
-
blk.6.attn_output.weightQ8_0[4096 4096]
-
blk.6.attn_q.weightQ8_0[4096 4096]
-
blk.6.attn_v.weightQ8_0[4096 512]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weightQ8_0[11008 4096]
-
blk.7.ffn_gate.weightQ8_0[4096 11008]
-
blk.7.ffn_up.weightQ8_0[4096 11008]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weightQ8_0[4096 512]
-
blk.7.attn_output.weightQ8_0[4096 4096]
-
blk.7.attn_q.weightQ8_0[4096 4096]
-
blk.7.attn_v.weightQ8_0[4096 512]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weightQ8_0[11008 4096]
-
blk.8.ffn_gate.weightQ8_0[4096 11008]
-
blk.8.ffn_up.weightQ8_0[4096 11008]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weightQ8_0[4096 512]
-
blk.8.attn_output.weightQ8_0[4096 4096]
-
blk.8.attn_q.weightQ8_0[4096 4096]
-
blk.8.attn_v.weightQ8_0[4096 512]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weightQ8_0[11008 4096]
-
blk.9.ffn_gate.weightQ8_0[4096 11008]
-
blk.9.ffn_up.weightQ8_0[4096 11008]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weightQ8_0[4096 512]
-
blk.9.attn_output.weightQ8_0[4096 4096]
-
blk.9.attn_q.weightQ8_0[4096 4096]
-
blk.9.attn_v.weightQ8_0[4096 512]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightQ8_0[11008 4096]
-
blk.10.ffn_gate.weightQ8_0[4096 11008]
-
blk.10.ffn_up.weightQ8_0[4096 11008]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.attn_k.weightQ8_0[4096 512]
-
blk.10.attn_output.weightQ8_0[4096 4096]
-
blk.10.attn_q.weightQ8_0[4096 4096]
-
blk.10.attn_v.weightQ8_0[4096 512]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightQ8_0[11008 4096]
-
blk.11.ffn_gate.weightQ8_0[4096 11008]
-
blk.11.ffn_up.weightQ8_0[4096 11008]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.attn_k.weightQ8_0[4096 512]
-
blk.11.attn_output.weightQ8_0[4096 4096]
-
blk.11.attn_q.weightQ8_0[4096 4096]
-
blk.11.attn_v.weightQ8_0[4096 512]
-
blk.12.ffn_gate.weightQ8_0[4096 11008]
-
blk.12.ffn_up.weightQ8_0[4096 11008]
-
blk.12.attn_k.weightQ8_0[4096 512]
-
blk.12.attn_output.weightQ8_0[4096 4096]
-
blk.12.attn_q.weightQ8_0[4096 4096]
-
blk.12.attn_v.weightQ8_0[4096 512]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightQ8_0[11008 4096]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightQ8_0[11008 4096]
-
blk.13.ffn_gate.weightQ8_0[4096 11008]
-
blk.13.ffn_up.weightQ8_0[4096 11008]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weightQ8_0[4096 512]
-
blk.13.attn_output.weightQ8_0[4096 4096]
-
blk.13.attn_q.weightQ8_0[4096 4096]
-
blk.13.attn_v.weightQ8_0[4096 512]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weightQ8_0[11008 4096]
-
blk.14.ffn_gate.weightQ8_0[4096 11008]
-
blk.14.ffn_up.weightQ8_0[4096 11008]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weightQ8_0[4096 512]
-
blk.14.attn_output.weightQ8_0[4096 4096]
-
blk.14.attn_q.weightQ8_0[4096 4096]
-
blk.14.attn_v.weightQ8_0[4096 512]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weightQ8_0[11008 4096]
-
blk.15.ffn_gate.weightQ8_0[4096 11008]
-
blk.15.ffn_up.weightQ8_0[4096 11008]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weightQ8_0[4096 512]
-
blk.15.attn_output.weightQ8_0[4096 4096]
-
blk.15.attn_q.weightQ8_0[4096 4096]
-
blk.15.attn_v.weightQ8_0[4096 512]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weightQ8_0[11008 4096]
-
blk.16.ffn_gate.weightQ8_0[4096 11008]
-
blk.16.ffn_up.weightQ8_0[4096 11008]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weightQ8_0[4096 512]
-
blk.16.attn_output.weightQ8_0[4096 4096]
-
blk.16.attn_q.weightQ8_0[4096 4096]
-
blk.16.attn_v.weightQ8_0[4096 512]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weightQ8_0[11008 4096]
-
blk.17.ffn_gate.weightQ8_0[4096 11008]
-
blk.17.ffn_up.weightQ8_0[4096 11008]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.attn_k.weightQ8_0[4096 512]
-
blk.17.attn_output.weightQ8_0[4096 4096]
-
blk.17.attn_q.weightQ8_0[4096 4096]
-
blk.17.attn_v.weightQ8_0[4096 512]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weightQ8_0[11008 4096]
-
blk.18.ffn_gate.weightQ8_0[4096 11008]
-
blk.18.ffn_up.weightQ8_0[4096 11008]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weightQ8_0[4096 512]
-
blk.18.attn_output.weightQ8_0[4096 4096]
-
blk.18.attn_q.weightQ8_0[4096 4096]
-
blk.18.attn_v.weightQ8_0[4096 512]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weightQ8_0[11008 4096]
-
blk.19.ffn_gate.weightQ8_0[4096 11008]
-
blk.19.ffn_up.weightQ8_0[4096 11008]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weightQ8_0[4096 512]
-
blk.19.attn_output.weightQ8_0[4096 4096]
-
blk.19.attn_q.weightQ8_0[4096 4096]
-
blk.19.attn_v.weightQ8_0[4096 512]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weightQ8_0[11008 4096]
-
blk.20.ffn_gate.weightQ8_0[4096 11008]
-
blk.20.ffn_up.weightQ8_0[4096 11008]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weightQ8_0[4096 512]
-
blk.20.attn_output.weightQ8_0[4096 4096]
-
blk.20.attn_q.weightQ8_0[4096 4096]
-
blk.20.attn_v.weightQ8_0[4096 512]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weightQ8_0[11008 4096]
-
blk.21.ffn_gate.weightQ8_0[4096 11008]
-
blk.21.ffn_up.weightQ8_0[4096 11008]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weightQ8_0[4096 512]
-
blk.21.attn_output.weightQ8_0[4096 4096]
-
blk.21.attn_q.weightQ8_0[4096 4096]
-
blk.21.attn_v.weightQ8_0[4096 512]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weightQ8_0[11008 4096]
-
blk.22.ffn_gate.weightQ8_0[4096 11008]
-
blk.22.ffn_up.weightQ8_0[4096 11008]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.attn_k.weightQ8_0[4096 512]
-
blk.22.attn_output.weightQ8_0[4096 4096]
-
blk.22.attn_q.weightQ8_0[4096 4096]
-
blk.22.attn_v.weightQ8_0[4096 512]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weightQ8_0[11008 4096]
-
blk.23.ffn_gate.weightQ8_0[4096 11008]
-
blk.23.ffn_up.weightQ8_0[4096 11008]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.attn_k.weightQ8_0[4096 512]
-
blk.23.attn_output.weightQ8_0[4096 4096]
-
blk.23.attn_q.weightQ8_0[4096 4096]
-
blk.23.attn_v.weightQ8_0[4096 512]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weightQ8_0[11008 4096]
-
blk.24.ffn_gate.weightQ8_0[4096 11008]
-
blk.24.ffn_up.weightQ8_0[4096 11008]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weightQ8_0[4096 512]
-
blk.24.attn_output.weightQ8_0[4096 4096]
-
blk.24.attn_q.weightQ8_0[4096 4096]
-
blk.24.attn_v.weightQ8_0[4096 512]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weightQ8_0[11008 4096]
-
blk.25.ffn_gate.weightQ8_0[4096 11008]
-
blk.25.ffn_up.weightQ8_0[4096 11008]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weightQ8_0[4096 512]
-
blk.25.attn_output.weightQ8_0[4096 4096]
-
blk.25.attn_q.weightQ8_0[4096 4096]
-
blk.25.attn_v.weightQ8_0[4096 512]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weightQ8_0[11008 4096]
-
blk.26.ffn_gate.weightQ8_0[4096 11008]
-
blk.26.ffn_up.weightQ8_0[4096 11008]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weightQ8_0[4096 512]
-
blk.26.attn_output.weightQ8_0[4096 4096]
-
blk.26.attn_q.weightQ8_0[4096 4096]
-
blk.26.attn_v.weightQ8_0[4096 512]
-
blk.27.attn_k.weightQ8_0[4096 512]
-
blk.27.attn_q.weightQ8_0[4096 4096]
-
blk.27.attn_v.weightQ8_0[4096 512]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weightQ8_0[11008 4096]
-
blk.27.ffn_gate.weightQ8_0[4096 11008]
-
blk.27.ffn_up.weightQ8_0[4096 11008]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_output.weightQ8_0[4096 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weightQ8_0[11008 4096]
-
blk.28.ffn_gate.weightQ8_0[4096 11008]
-
blk.28.ffn_up.weightQ8_0[4096 11008]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weightQ8_0[4096 512]
-
blk.28.attn_output.weightQ8_0[4096 4096]
-
blk.28.attn_q.weightQ8_0[4096 4096]
-
blk.28.attn_v.weightQ8_0[4096 512]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weightQ8_0[11008 4096]
-
blk.29.ffn_gate.weightQ8_0[4096 11008]
-
blk.29.ffn_up.weightQ8_0[4096 11008]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.attn_k.weightQ8_0[4096 512]
-
blk.29.attn_output.weightQ8_0[4096 4096]
-
blk.29.attn_q.weightQ8_0[4096 4096]
-
blk.29.attn_v.weightQ8_0[4096 512]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weightQ8_0[11008 4096]
-
blk.30.ffn_gate.weightQ8_0[4096 11008]
-
blk.30.ffn_up.weightQ8_0[4096 11008]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weightQ8_0[4096 512]
-
blk.30.attn_output.weightQ8_0[4096 4096]
-
blk.30.attn_q.weightQ8_0[4096 4096]
-
blk.30.attn_v.weightQ8_0[4096 512]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weightQ8_0[11008 4096]
-
blk.31.ffn_gate.weightQ8_0[4096 11008]
-
blk.31.ffn_up.weightQ8_0[4096 11008]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weightQ8_0[4096 512]
-
blk.31.attn_output.weightQ8_0[4096 4096]
-
blk.31.attn_q.weightQ8_0[4096 4096]
-
blk.31.attn_v.weightQ8_0[4096 512]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.ffn_down.weightQ8_0[11008 4096]
-
blk.32.ffn_gate.weightQ8_0[4096 11008]
-
blk.32.ffn_up.weightQ8_0[4096 11008]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.attn_k.weightQ8_0[4096 512]
-
blk.32.attn_output.weightQ8_0[4096 4096]
-
blk.32.attn_q.weightQ8_0[4096 4096]
-
blk.32.attn_v.weightQ8_0[4096 512]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.ffn_down.weightQ8_0[11008 4096]
-
blk.33.ffn_gate.weightQ8_0[4096 11008]
-
blk.33.ffn_up.weightQ8_0[4096 11008]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.attn_k.weightQ8_0[4096 512]
-
blk.33.attn_output.weightQ8_0[4096 4096]
-
blk.33.attn_q.weightQ8_0[4096 4096]
-
blk.33.attn_v.weightQ8_0[4096 512]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.ffn_down.weightQ8_0[11008 4096]
-
blk.34.ffn_gate.weightQ8_0[4096 11008]
-
blk.34.ffn_up.weightQ8_0[4096 11008]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.attn_k.weightQ8_0[4096 512]
-
blk.34.attn_output.weightQ8_0[4096 4096]
-
blk.34.attn_q.weightQ8_0[4096 4096]
-
blk.34.attn_v.weightQ8_0[4096 512]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.ffn_down.weightQ8_0[11008 4096]
-
blk.35.ffn_gate.weightQ8_0[4096 11008]
-
blk.35.ffn_up.weightQ8_0[4096 11008]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.attn_k.weightQ8_0[4096 512]
-
blk.35.attn_output.weightQ8_0[4096 4096]
-
blk.35.attn_q.weightQ8_0[4096 4096]
-
blk.35.attn_v.weightQ8_0[4096 512]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.ffn_down.weightQ8_0[11008 4096]
-
blk.36.ffn_gate.weightQ8_0[4096 11008]
-
blk.36.ffn_up.weightQ8_0[4096 11008]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.attn_k.weightQ8_0[4096 512]
-
blk.36.attn_output.weightQ8_0[4096 4096]
-
blk.36.attn_q.weightQ8_0[4096 4096]
-
blk.36.attn_v.weightQ8_0[4096 512]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.ffn_down.weightQ8_0[11008 4096]
-
blk.37.ffn_gate.weightQ8_0[4096 11008]
-
blk.37.ffn_up.weightQ8_0[4096 11008]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.attn_k.weightQ8_0[4096 512]
-
blk.37.attn_output.weightQ8_0[4096 4096]
-
blk.37.attn_q.weightQ8_0[4096 4096]
-
blk.37.attn_v.weightQ8_0[4096 512]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.ffn_down.weightQ8_0[11008 4096]
-
blk.38.ffn_gate.weightQ8_0[4096 11008]
-
blk.38.ffn_up.weightQ8_0[4096 11008]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.attn_k.weightQ8_0[4096 512]
-
blk.38.attn_output.weightQ8_0[4096 4096]
-
blk.38.attn_q.weightQ8_0[4096 4096]
-
blk.38.attn_v.weightQ8_0[4096 512]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.ffn_down.weightQ8_0[11008 4096]
-
blk.39.ffn_gate.weightQ8_0[4096 11008]
-
blk.39.ffn_up.weightQ8_0[4096 11008]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.attn_k.weightQ8_0[4096 512]
-
blk.39.attn_output.weightQ8_0[4096 4096]
-
blk.39.attn_q.weightQ8_0[4096 4096]
-
blk.39.attn_v.weightQ8_0[4096 512]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.ffn_down.weightQ8_0[11008 4096]
-
blk.40.ffn_gate.weightQ8_0[4096 11008]
-
blk.40.ffn_up.weightQ8_0[4096 11008]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.attn_k.weightQ8_0[4096 512]
-
blk.40.attn_output.weightQ8_0[4096 4096]
-
blk.40.attn_q.weightQ8_0[4096 4096]
-
blk.40.attn_v.weightQ8_0[4096 512]
-
blk.41.ffn_gate.weightQ8_0[4096 11008]
-
blk.41.attn_k.weightQ8_0[4096 512]
-
blk.41.attn_output.weightQ8_0[4096 4096]
-
blk.41.attn_q.weightQ8_0[4096 4096]
-
blk.41.attn_v.weightQ8_0[4096 512]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.ffn_down.weightQ8_0[11008 4096]
-
blk.41.ffn_up.weightQ8_0[4096 11008]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.ffn_down.weightQ8_0[11008 4096]
-
blk.42.ffn_gate.weightQ8_0[4096 11008]
-
blk.42.ffn_up.weightQ8_0[4096 11008]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.attn_k.weightQ8_0[4096 512]
-
blk.42.attn_output.weightQ8_0[4096 4096]
-
blk.42.attn_q.weightQ8_0[4096 4096]
-
blk.42.attn_v.weightQ8_0[4096 512]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.ffn_down.weightQ8_0[11008 4096]
-
blk.43.ffn_gate.weightQ8_0[4096 11008]
-
blk.43.ffn_up.weightQ8_0[4096 11008]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.attn_k.weightQ8_0[4096 512]
-
blk.43.attn_output.weightQ8_0[4096 4096]
-
blk.43.attn_q.weightQ8_0[4096 4096]
-
blk.43.attn_v.weightQ8_0[4096 512]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.ffn_down.weightQ8_0[11008 4096]
-
blk.44.ffn_gate.weightQ8_0[4096 11008]
-
blk.44.ffn_up.weightQ8_0[4096 11008]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.attn_k.weightQ8_0[4096 512]
-
blk.44.attn_output.weightQ8_0[4096 4096]
-
blk.44.attn_q.weightQ8_0[4096 4096]
-
blk.44.attn_v.weightQ8_0[4096 512]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.ffn_down.weightQ8_0[11008 4096]
-
blk.45.ffn_gate.weightQ8_0[4096 11008]
-
blk.45.ffn_up.weightQ8_0[4096 11008]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.attn_k.weightQ8_0[4096 512]
-
blk.45.attn_output.weightQ8_0[4096 4096]
-
blk.45.attn_q.weightQ8_0[4096 4096]
-
blk.45.attn_v.weightQ8_0[4096 512]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.ffn_down.weightQ8_0[11008 4096]
-
blk.46.ffn_gate.weightQ8_0[4096 11008]
-
blk.46.ffn_up.weightQ8_0[4096 11008]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.attn_k.weightQ8_0[4096 512]
-
blk.46.attn_output.weightQ8_0[4096 4096]
-
blk.46.attn_q.weightQ8_0[4096 4096]
-
blk.46.attn_v.weightQ8_0[4096 512]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.ffn_down.weightQ8_0[11008 4096]
-
blk.47.ffn_gate.weightQ8_0[4096 11008]
-
blk.47.ffn_up.weightQ8_0[4096 11008]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.attn_k.weightQ8_0[4096 512]
-
blk.47.attn_output.weightQ8_0[4096 4096]
-
blk.47.attn_q.weightQ8_0[4096 4096]
-
blk.47.attn_v.weightQ8_0[4096 512]
-
output.weightQ8_0[4096 64000]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47