latest
40GB
🦙🦙🦙 Llama3-70B-Chinese-Chat is an instruction-tuned language model for Chinese & English users with various abilities such as roleplaying & tool-using built upon the Meta-Llama-3-70B-Instruct model.
70B
182 Pulls Updated 4 months ago
23cd31b73d5d · 40GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count80
-
llama.context_length8192
-
llama.embedding_length8192
-
llama.feed_forward_length28672
-
llama.rope.dimension_count128
-
llama.rope.freq_base500000
-
llama.vocab_size128256
-
tokenizer.ggml.bos_token_id128000
-
tokenizer.ggml.eos_token_id128009
-
tokenizer.ggml.merges[Ä Ä Ä Ä Ä Ä Ä Ä Ä Ä Ä Ä Ä Ä i n ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id128009
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ4_0[8192 128256]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ4_0[28672 8192]
-
blk.0.ffn_gate.weightQ4_0[8192 28672]
-
blk.0.ffn_up.weightQ4_0[8192 28672]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ4_0[8192 1024]
-
blk.0.attn_output.weightQ4_0[8192 8192]
-
blk.0.attn_q.weightQ4_0[8192 8192]
-
blk.0.attn_v.weightQ4_0[8192 1024]
-
blk.1.ffn_gate.weightQ4_0[8192 28672]
-
blk.1.attn_k.weightQ4_0[8192 1024]
-
blk.1.attn_output.weightQ4_0[8192 8192]
-
blk.1.attn_q.weightQ4_0[8192 8192]
-
blk.1.attn_v.weightQ4_0[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ4_0[28672 8192]
-
blk.1.ffn_up.weightQ4_0[8192 28672]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ4_0[28672 8192]
-
blk.2.ffn_gate.weightQ4_0[8192 28672]
-
blk.2.ffn_up.weightQ4_0[8192 28672]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightQ4_0[8192 1024]
-
blk.2.attn_output.weightQ4_0[8192 8192]
-
blk.2.attn_q.weightQ4_0[8192 8192]
-
blk.2.attn_v.weightQ4_0[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ4_0[28672 8192]
-
blk.3.ffn_gate.weightQ4_0[8192 28672]
-
blk.3.ffn_up.weightQ4_0[8192 28672]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightQ4_0[8192 1024]
-
blk.3.attn_output.weightQ4_0[8192 8192]
-
blk.3.attn_q.weightQ4_0[8192 8192]
-
blk.3.attn_v.weightQ4_0[8192 1024]
-
blk.4.attn_k.weightQ4_0[8192 1024]
-
blk.4.attn_output.weightQ4_0[8192 8192]
-
blk.4.attn_q.weightQ4_0[8192 8192]
-
blk.4.attn_v.weightQ4_0[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ4_0[28672 8192]
-
blk.4.ffn_gate.weightQ4_0[8192 28672]
-
blk.4.ffn_up.weightQ4_0[8192 28672]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ4_0[28672 8192]
-
blk.5.ffn_gate.weightQ4_0[8192 28672]
-
blk.5.ffn_up.weightQ4_0[8192 28672]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.weightQ4_0[8192 1024]
-
blk.5.attn_output.weightQ4_0[8192 8192]
-
blk.5.attn_q.weightQ4_0[8192 8192]
-
blk.5.attn_v.weightQ4_0[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_0[28672 8192]
-
blk.6.ffn_gate.weightQ4_0[8192 28672]
-
blk.6.ffn_up.weightQ4_0[8192 28672]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.weightQ4_0[8192 1024]
-
blk.6.attn_output.weightQ4_0[8192 8192]
-
blk.6.attn_q.weightQ4_0[8192 8192]
-
blk.6.attn_v.weightQ4_0[8192 1024]
-
blk.7.attn_k.weightQ4_0[8192 1024]
-
blk.7.attn_q.weightQ4_0[8192 8192]
-
blk.7.attn_v.weightQ4_0[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_0[28672 8192]
-
blk.7.ffn_gate.weightQ4_0[8192 28672]
-
blk.7.ffn_up.weightQ4_0[8192 28672]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_output.weightQ4_0[8192 8192]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ4_0[28672 8192]
-
blk.8.ffn_gate.weightQ4_0[8192 28672]
-
blk.8.ffn_up.weightQ4_0[8192 28672]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.weightQ4_0[8192 1024]
-
blk.8.attn_output.weightQ4_0[8192 8192]
-
blk.8.attn_q.weightQ4_0[8192 8192]
-
blk.8.attn_v.weightQ4_0[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_0[28672 8192]
-
blk.9.ffn_gate.weightQ4_0[8192 28672]
-
blk.9.ffn_up.weightQ4_0[8192 28672]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ4_0[8192 1024]
-
blk.9.attn_output.weightQ4_0[8192 8192]
-
blk.9.attn_q.weightQ4_0[8192 8192]
-
blk.9.attn_v.weightQ4_0[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_0[28672 8192]
-
blk.10.ffn_gate.weightQ4_0[8192 28672]
-
blk.10.ffn_up.weightQ4_0[8192 28672]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightQ4_0[8192 1024]
-
blk.10.attn_output.weightQ4_0[8192 8192]
-
blk.10.attn_q.weightQ4_0[8192 8192]
-
blk.10.attn_v.weightQ4_0[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_0[28672 8192]
-
blk.11.ffn_gate.weightQ4_0[8192 28672]
-
blk.11.ffn_up.weightQ4_0[8192 28672]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightQ4_0[8192 1024]
-
blk.11.attn_output.weightQ4_0[8192 8192]
-
blk.11.attn_q.weightQ4_0[8192 8192]
-
blk.11.attn_v.weightQ4_0[8192 1024]
-
blk.12.ffn_gate.weightQ4_0[8192 28672]
-
blk.12.ffn_up.weightQ4_0[8192 28672]
-
blk.12.attn_k.weightQ4_0[8192 1024]
-
blk.12.attn_output.weightQ4_0[8192 8192]
-
blk.12.attn_q.weightQ4_0[8192 8192]
-
blk.12.attn_v.weightQ4_0[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_0[28672 8192]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_0[28672 8192]
-
blk.13.ffn_gate.weightQ4_0[8192 28672]
-
blk.13.ffn_up.weightQ4_0[8192 28672]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.weightQ4_0[8192 1024]
-
blk.13.attn_output.weightQ4_0[8192 8192]
-
blk.13.attn_q.weightQ4_0[8192 8192]
-
blk.13.attn_v.weightQ4_0[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_0[28672 8192]
-
blk.14.ffn_gate.weightQ4_0[8192 28672]
-
blk.14.ffn_up.weightQ4_0[8192 28672]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ4_0[8192 1024]
-
blk.14.attn_output.weightQ4_0[8192 8192]
-
blk.14.attn_q.weightQ4_0[8192 8192]
-
blk.14.attn_v.weightQ4_0[8192 1024]
-
blk.15.ffn_gate.weightQ4_0[8192 28672]
-
blk.15.attn_k.weightQ4_0[8192 1024]
-
blk.15.attn_output.weightQ4_0[8192 8192]
-
blk.15.attn_q.weightQ4_0[8192 8192]
-
blk.15.attn_v.weightQ4_0[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_0[28672 8192]
-
blk.15.ffn_up.weightQ4_0[8192 28672]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_0[28672 8192]
-
blk.16.ffn_gate.weightQ4_0[8192 28672]
-
blk.16.ffn_up.weightQ4_0[8192 28672]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.weightQ4_0[8192 1024]
-
blk.16.attn_output.weightQ4_0[8192 8192]
-
blk.16.attn_q.weightQ4_0[8192 8192]
-
blk.16.attn_v.weightQ4_0[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_0[28672 8192]
-
blk.17.ffn_gate.weightQ4_0[8192 28672]
-
blk.17.ffn_up.weightQ4_0[8192 28672]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightQ4_0[8192 1024]
-
blk.17.attn_output.weightQ4_0[8192 8192]
-
blk.17.attn_q.weightQ4_0[8192 8192]
-
blk.17.attn_v.weightQ4_0[8192 1024]
-
blk.18.attn_k.weightQ4_0[8192 1024]
-
blk.18.attn_output.weightQ4_0[8192 8192]
-
blk.18.attn_q.weightQ4_0[8192 8192]
-
blk.18.attn_v.weightQ4_0[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_0[28672 8192]
-
blk.18.ffn_gate.weightQ4_0[8192 28672]
-
blk.18.ffn_up.weightQ4_0[8192 28672]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_0[28672 8192]
-
blk.19.ffn_gate.weightQ4_0[8192 28672]
-
blk.19.ffn_up.weightQ4_0[8192 28672]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.weightQ4_0[8192 1024]
-
blk.19.attn_output.weightQ4_0[8192 8192]
-
blk.19.attn_q.weightQ4_0[8192 8192]
-
blk.19.attn_v.weightQ4_0[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_0[28672 8192]
-
blk.20.ffn_gate.weightQ4_0[8192 28672]
-
blk.20.ffn_up.weightQ4_0[8192 28672]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightQ4_0[8192 1024]
-
blk.20.attn_output.weightQ4_0[8192 8192]
-
blk.20.attn_q.weightQ4_0[8192 8192]
-
blk.20.attn_v.weightQ4_0[8192 1024]
-
blk.21.attn_k.weightQ4_0[8192 1024]
-
blk.21.attn_q.weightQ4_0[8192 8192]
-
blk.21.attn_v.weightQ4_0[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_0[28672 8192]
-
blk.21.ffn_gate.weightQ4_0[8192 28672]
-
blk.21.ffn_up.weightQ4_0[8192 28672]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_output.weightQ4_0[8192 8192]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_0[28672 8192]
-
blk.22.ffn_gate.weightQ4_0[8192 28672]
-
blk.22.ffn_up.weightQ4_0[8192 28672]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.weightQ4_0[8192 1024]
-
blk.22.attn_output.weightQ4_0[8192 8192]
-
blk.22.attn_q.weightQ4_0[8192 8192]
-
blk.22.attn_v.weightQ4_0[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_0[28672 8192]
-
blk.23.ffn_gate.weightQ4_0[8192 28672]
-
blk.23.ffn_up.weightQ4_0[8192 28672]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ4_0[8192 1024]
-
blk.23.attn_output.weightQ4_0[8192 8192]
-
blk.23.attn_q.weightQ4_0[8192 8192]
-
blk.23.attn_v.weightQ4_0[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_0[28672 8192]
-
blk.24.ffn_gate.weightQ4_0[8192 28672]
-
blk.24.ffn_up.weightQ4_0[8192 28672]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightQ4_0[8192 1024]
-
blk.24.attn_output.weightQ4_0[8192 8192]
-
blk.24.attn_q.weightQ4_0[8192 8192]
-
blk.24.attn_v.weightQ4_0[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_0[28672 8192]
-
blk.25.ffn_gate.weightQ4_0[8192 28672]
-
blk.25.ffn_up.weightQ4_0[8192 28672]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.weightQ4_0[8192 1024]
-
blk.25.attn_output.weightQ4_0[8192 8192]
-
blk.25.attn_q.weightQ4_0[8192 8192]
-
blk.25.attn_v.weightQ4_0[8192 1024]
-
blk.26.ffn_gate.weightQ4_0[8192 28672]
-
blk.26.ffn_up.weightQ4_0[8192 28672]
-
blk.26.attn_k.weightQ4_0[8192 1024]
-
blk.26.attn_output.weightQ4_0[8192 8192]
-
blk.26.attn_q.weightQ4_0[8192 8192]
-
blk.26.attn_v.weightQ4_0[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_0[28672 8192]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_0[28672 8192]
-
blk.27.ffn_gate.weightQ4_0[8192 28672]
-
blk.27.ffn_up.weightQ4_0[8192 28672]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.attn_k.weightQ4_0[8192 1024]
-
blk.27.attn_output.weightQ4_0[8192 8192]
-
blk.27.attn_q.weightQ4_0[8192 8192]
-
blk.27.attn_v.weightQ4_0[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_0[28672 8192]
-
blk.28.ffn_gate.weightQ4_0[8192 28672]
-
blk.28.ffn_up.weightQ4_0[8192 28672]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ4_0[8192 1024]
-
blk.28.attn_output.weightQ4_0[8192 8192]
-
blk.28.attn_q.weightQ4_0[8192 8192]
-
blk.28.attn_v.weightQ4_0[8192 1024]
-
blk.29.ffn_gate.weightQ4_0[8192 28672]
-
blk.29.attn_k.weightQ4_0[8192 1024]
-
blk.29.attn_output.weightQ4_0[8192 8192]
-
blk.29.attn_q.weightQ4_0[8192 8192]
-
blk.29.attn_v.weightQ4_0[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_0[28672 8192]
-
blk.29.ffn_up.weightQ4_0[8192 28672]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_0[28672 8192]
-
blk.30.ffn_gate.weightQ4_0[8192 28672]
-
blk.30.ffn_up.weightQ4_0[8192 28672]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.weightQ4_0[8192 1024]
-
blk.30.attn_output.weightQ4_0[8192 8192]
-
blk.30.attn_q.weightQ4_0[8192 8192]
-
blk.30.attn_v.weightQ4_0[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_0[28672 8192]
-
blk.31.ffn_gate.weightQ4_0[8192 28672]
-
blk.31.ffn_up.weightQ4_0[8192 28672]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.weightQ4_0[8192 1024]
-
blk.31.attn_output.weightQ4_0[8192 8192]
-
blk.31.attn_q.weightQ4_0[8192 8192]
-
blk.31.attn_v.weightQ4_0[8192 1024]
-
blk.32.attn_k.weightQ4_0[8192 1024]
-
blk.32.attn_output.weightQ4_0[8192 8192]
-
blk.32.attn_q.weightQ4_0[8192 8192]
-
blk.32.attn_v.weightQ4_0[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_0[28672 8192]
-
blk.32.ffn_gate.weightQ4_0[8192 28672]
-
blk.32.ffn_up.weightQ4_0[8192 28672]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_0[28672 8192]
-
blk.33.ffn_gate.weightQ4_0[8192 28672]
-
blk.33.ffn_up.weightQ4_0[8192 28672]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.weightQ4_0[8192 1024]
-
blk.33.attn_output.weightQ4_0[8192 8192]
-
blk.33.attn_q.weightQ4_0[8192 8192]
-
blk.33.attn_v.weightQ4_0[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_0[28672 8192]
-
blk.34.ffn_gate.weightQ4_0[8192 28672]
-
blk.34.ffn_up.weightQ4_0[8192 28672]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightQ4_0[8192 1024]
-
blk.34.attn_output.weightQ4_0[8192 8192]
-
blk.34.attn_q.weightQ4_0[8192 8192]
-
blk.34.attn_v.weightQ4_0[8192 1024]
-
blk.35.attn_k.weightQ4_0[8192 1024]
-
blk.35.attn_q.weightQ4_0[8192 8192]
-
blk.35.attn_v.weightQ4_0[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_0[28672 8192]
-
blk.35.ffn_gate.weightQ4_0[8192 28672]
-
blk.35.ffn_up.weightQ4_0[8192 28672]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_output.weightQ4_0[8192 8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_0[28672 8192]
-
blk.36.ffn_gate.weightQ4_0[8192 28672]
-
blk.36.ffn_up.weightQ4_0[8192 28672]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.weightQ4_0[8192 1024]
-
blk.36.attn_output.weightQ4_0[8192 8192]
-
blk.36.attn_q.weightQ4_0[8192 8192]
-
blk.36.attn_v.weightQ4_0[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_0[28672 8192]
-
blk.37.ffn_gate.weightQ4_0[8192 28672]
-
blk.37.ffn_up.weightQ4_0[8192 28672]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.weightQ4_0[8192 1024]
-
blk.37.attn_output.weightQ4_0[8192 8192]
-
blk.37.attn_q.weightQ4_0[8192 8192]
-
blk.37.attn_v.weightQ4_0[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_0[28672 8192]
-
blk.38.ffn_gate.weightQ4_0[8192 28672]
-
blk.38.ffn_up.weightQ4_0[8192 28672]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightQ4_0[8192 1024]
-
blk.38.attn_output.weightQ4_0[8192 8192]
-
blk.38.attn_q.weightQ4_0[8192 8192]
-
blk.38.attn_v.weightQ4_0[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_0[28672 8192]
-
blk.39.ffn_gate.weightQ4_0[8192 28672]
-
blk.39.ffn_up.weightQ4_0[8192 28672]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ4_0[8192 1024]
-
blk.39.attn_output.weightQ4_0[8192 8192]
-
blk.39.attn_q.weightQ4_0[8192 8192]
-
blk.39.attn_v.weightQ4_0[8192 1024]
-
blk.40.ffn_gate.weightQ4_0[8192 28672]
-
blk.40.ffn_up.weightQ4_0[8192 28672]
-
blk.40.attn_k.weightQ4_0[8192 1024]
-
blk.40.attn_output.weightQ4_0[8192 8192]
-
blk.40.attn_q.weightQ4_0[8192 8192]
-
blk.40.attn_v.weightQ4_0[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ4_0[28672 8192]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ4_0[28672 8192]
-
blk.41.ffn_gate.weightQ4_0[8192 28672]
-
blk.41.ffn_up.weightQ4_0[8192 28672]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.weightQ4_0[8192 1024]
-
blk.41.attn_output.weightQ4_0[8192 8192]
-
blk.41.attn_q.weightQ4_0[8192 8192]
-
blk.41.attn_v.weightQ4_0[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ4_0[28672 8192]
-
blk.42.ffn_gate.weightQ4_0[8192 28672]
-
blk.42.ffn_up.weightQ4_0[8192 28672]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightQ4_0[8192 1024]
-
blk.42.attn_output.weightQ4_0[8192 8192]
-
blk.42.attn_q.weightQ4_0[8192 8192]
-
blk.42.attn_v.weightQ4_0[8192 1024]
-
blk.43.ffn_gate.weightQ4_0[8192 28672]
-
blk.43.attn_k.weightQ4_0[8192 1024]
-
blk.43.attn_output.weightQ4_0[8192 8192]
-
blk.43.attn_q.weightQ4_0[8192 8192]
-
blk.43.attn_v.weightQ4_0[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ4_0[28672 8192]
-
blk.43.ffn_up.weightQ4_0[8192 28672]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ4_0[28672 8192]
-
blk.44.ffn_gate.weightQ4_0[8192 28672]
-
blk.44.ffn_up.weightQ4_0[8192 28672]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.weightQ4_0[8192 1024]
-
blk.44.attn_output.weightQ4_0[8192 8192]
-
blk.44.attn_q.weightQ4_0[8192 8192]
-
blk.44.attn_v.weightQ4_0[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ4_0[28672 8192]
-
blk.45.ffn_gate.weightQ4_0[8192 28672]
-
blk.45.ffn_up.weightQ4_0[8192 28672]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightQ4_0[8192 1024]
-
blk.45.attn_output.weightQ4_0[8192 8192]
-
blk.45.attn_q.weightQ4_0[8192 8192]
-
blk.45.attn_v.weightQ4_0[8192 1024]
-
blk.46.attn_k.weightQ4_0[8192 1024]
-
blk.46.attn_output.weightQ4_0[8192 8192]
-
blk.46.attn_q.weightQ4_0[8192 8192]
-
blk.46.attn_v.weightQ4_0[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ4_0[28672 8192]
-
blk.46.ffn_gate.weightQ4_0[8192 28672]
-
blk.46.ffn_up.weightQ4_0[8192 28672]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ4_0[28672 8192]
-
blk.47.ffn_gate.weightQ4_0[8192 28672]
-
blk.47.ffn_up.weightQ4_0[8192 28672]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.weightQ4_0[8192 1024]
-
blk.47.attn_output.weightQ4_0[8192 8192]
-
blk.47.attn_q.weightQ4_0[8192 8192]
-
blk.47.attn_v.weightQ4_0[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weightQ4_0[28672 8192]
-
blk.48.ffn_gate.weightQ4_0[8192 28672]
-
blk.48.ffn_up.weightQ4_0[8192 28672]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.weightQ4_0[8192 1024]
-
blk.48.attn_output.weightQ4_0[8192 8192]
-
blk.48.attn_q.weightQ4_0[8192 8192]
-
blk.48.attn_v.weightQ4_0[8192 1024]
-
blk.49.attn_k.weightQ4_0[8192 1024]
-
blk.49.attn_q.weightQ4_0[8192 8192]
-
blk.49.attn_v.weightQ4_0[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weightQ4_0[28672 8192]
-
blk.49.ffn_gate.weightQ4_0[8192 28672]
-
blk.49.ffn_up.weightQ4_0[8192 28672]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_output.weightQ4_0[8192 8192]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weightQ4_0[28672 8192]
-
blk.50.ffn_gate.weightQ4_0[8192 28672]
-
blk.50.ffn_up.weightQ4_0[8192 28672]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_k.weightQ4_0[8192 1024]
-
blk.50.attn_output.weightQ4_0[8192 8192]
-
blk.50.attn_q.weightQ4_0[8192 8192]
-
blk.50.attn_v.weightQ4_0[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weightQ4_0[28672 8192]
-
blk.51.ffn_gate.weightQ4_0[8192 28672]
-
blk.51.ffn_up.weightQ4_0[8192 28672]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.weightQ4_0[8192 1024]
-
blk.51.attn_output.weightQ4_0[8192 8192]
-
blk.51.attn_q.weightQ4_0[8192 8192]
-
blk.51.attn_v.weightQ4_0[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weightQ4_0[28672 8192]
-
blk.52.ffn_gate.weightQ4_0[8192 28672]
-
blk.52.ffn_up.weightQ4_0[8192 28672]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.weightQ4_0[8192 1024]
-
blk.52.attn_output.weightQ4_0[8192 8192]
-
blk.52.attn_q.weightQ4_0[8192 8192]
-
blk.52.attn_v.weightQ4_0[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weightQ4_0[28672 8192]
-
blk.53.ffn_gate.weightQ4_0[8192 28672]
-
blk.53.ffn_up.weightQ4_0[8192 28672]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.weightQ4_0[8192 1024]
-
blk.53.attn_output.weightQ4_0[8192 8192]
-
blk.53.attn_q.weightQ4_0[8192 8192]
-
blk.53.attn_v.weightQ4_0[8192 1024]
-
blk.54.ffn_gate.weightQ4_0[8192 28672]
-
blk.54.ffn_up.weightQ4_0[8192 28672]
-
blk.54.attn_k.weightQ4_0[8192 1024]
-
blk.54.attn_output.weightQ4_0[8192 8192]
-
blk.54.attn_q.weightQ4_0[8192 8192]
-
blk.54.attn_v.weightQ4_0[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weightQ4_0[28672 8192]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weightQ4_0[28672 8192]
-
blk.55.ffn_gate.weightQ4_0[8192 28672]
-
blk.55.ffn_up.weightQ4_0[8192 28672]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.attn_k.weightQ4_0[8192 1024]
-
blk.55.attn_output.weightQ4_0[8192 8192]
-
blk.55.attn_q.weightQ4_0[8192 8192]
-
blk.55.attn_v.weightQ4_0[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weightQ4_0[28672 8192]
-
blk.56.ffn_gate.weightQ4_0[8192 28672]
-
blk.56.ffn_up.weightQ4_0[8192 28672]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.weightQ4_0[8192 1024]
-
blk.56.attn_output.weightQ4_0[8192 8192]
-
blk.56.attn_q.weightQ4_0[8192 8192]
-
blk.56.attn_v.weightQ4_0[8192 1024]
-
blk.57.ffn_gate.weightQ4_0[8192 28672]
-
blk.57.attn_k.weightQ4_0[8192 1024]
-
blk.57.attn_output.weightQ4_0[8192 8192]
-
blk.57.attn_q.weightQ4_0[8192 8192]
-
blk.57.attn_v.weightQ4_0[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weightQ4_0[28672 8192]
-
blk.57.ffn_up.weightQ4_0[8192 28672]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weightQ4_0[28672 8192]
-
blk.58.ffn_gate.weightQ4_0[8192 28672]
-
blk.58.ffn_up.weightQ4_0[8192 28672]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.attn_k.weightQ4_0[8192 1024]
-
blk.58.attn_output.weightQ4_0[8192 8192]
-
blk.58.attn_q.weightQ4_0[8192 8192]
-
blk.58.attn_v.weightQ4_0[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weightQ4_0[28672 8192]
-
blk.59.ffn_gate.weightQ4_0[8192 28672]
-
blk.59.ffn_up.weightQ4_0[8192 28672]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.weightQ4_0[8192 1024]
-
blk.59.attn_output.weightQ4_0[8192 8192]
-
blk.59.attn_q.weightQ4_0[8192 8192]
-
blk.59.attn_v.weightQ4_0[8192 1024]
-
blk.60.attn_k.weightQ4_0[8192 1024]
-
blk.60.attn_output.weightQ4_0[8192 8192]
-
blk.60.attn_q.weightQ4_0[8192 8192]
-
blk.60.attn_v.weightQ4_0[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weightQ4_0[28672 8192]
-
blk.60.ffn_gate.weightQ4_0[8192 28672]
-
blk.60.ffn_up.weightQ4_0[8192 28672]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weightQ4_0[28672 8192]
-
blk.61.ffn_gate.weightQ4_0[8192 28672]
-
blk.61.ffn_up.weightQ4_0[8192 28672]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.attn_k.weightQ4_0[8192 1024]
-
blk.61.attn_output.weightQ4_0[8192 8192]
-
blk.61.attn_q.weightQ4_0[8192 8192]
-
blk.61.attn_v.weightQ4_0[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weightQ4_0[28672 8192]
-
blk.62.ffn_gate.weightQ4_0[8192 28672]
-
blk.62.ffn_up.weightQ4_0[8192 28672]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.weightQ4_0[8192 1024]
-
blk.62.attn_output.weightQ4_0[8192 8192]
-
blk.62.attn_q.weightQ4_0[8192 8192]
-
blk.62.attn_v.weightQ4_0[8192 1024]
-
blk.63.attn_k.weightQ4_0[8192 1024]
-
blk.63.attn_q.weightQ4_0[8192 8192]
-
blk.63.attn_v.weightQ4_0[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weightQ4_0[28672 8192]
-
blk.63.ffn_gate.weightQ4_0[8192 28672]
-
blk.63.ffn_up.weightQ4_0[8192 28672]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_output.weightQ4_0[8192 8192]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weightQ4_0[28672 8192]
-
blk.64.ffn_gate.weightQ4_0[8192 28672]
-
blk.64.ffn_up.weightQ4_0[8192 28672]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_k.weightQ4_0[8192 1024]
-
blk.64.attn_output.weightQ4_0[8192 8192]
-
blk.64.attn_q.weightQ4_0[8192 8192]
-
blk.64.attn_v.weightQ4_0[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weightQ4_0[28672 8192]
-
blk.65.ffn_gate.weightQ4_0[8192 28672]
-
blk.65.ffn_up.weightQ4_0[8192 28672]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.weightQ4_0[8192 1024]
-
blk.65.attn_output.weightQ4_0[8192 8192]
-
blk.65.attn_q.weightQ4_0[8192 8192]
-
blk.65.attn_v.weightQ4_0[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weightQ4_0[28672 8192]
-
blk.66.ffn_gate.weightQ4_0[8192 28672]
-
blk.66.ffn_up.weightQ4_0[8192 28672]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.weightQ4_0[8192 1024]
-
blk.66.attn_output.weightQ4_0[8192 8192]
-
blk.66.attn_q.weightQ4_0[8192 8192]
-
blk.66.attn_v.weightQ4_0[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weightQ4_0[28672 8192]
-
blk.67.ffn_gate.weightQ4_0[8192 28672]
-
blk.67.ffn_up.weightQ4_0[8192 28672]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.weightQ4_0[8192 1024]
-
blk.67.attn_output.weightQ4_0[8192 8192]
-
blk.67.attn_q.weightQ4_0[8192 8192]
-
blk.67.attn_v.weightQ4_0[8192 1024]
-
blk.68.ffn_gate.weightQ4_0[8192 28672]
-
blk.68.ffn_up.weightQ4_0[8192 28672]
-
blk.68.attn_k.weightQ4_0[8192 1024]
-
blk.68.attn_output.weightQ4_0[8192 8192]
-
blk.68.attn_q.weightQ4_0[8192 8192]
-
blk.68.attn_v.weightQ4_0[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weightQ4_0[28672 8192]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weightQ4_0[28672 8192]
-
blk.69.ffn_gate.weightQ4_0[8192 28672]
-
blk.69.ffn_up.weightQ4_0[8192 28672]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_k.weightQ4_0[8192 1024]
-
blk.69.attn_output.weightQ4_0[8192 8192]
-
blk.69.attn_q.weightQ4_0[8192 8192]
-
blk.69.attn_v.weightQ4_0[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weightQ4_0[28672 8192]
-
blk.70.ffn_gate.weightQ4_0[8192 28672]
-
blk.70.ffn_up.weightQ4_0[8192 28672]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.weightQ4_0[8192 1024]
-
blk.70.attn_output.weightQ4_0[8192 8192]
-
blk.70.attn_q.weightQ4_0[8192 8192]
-
blk.70.attn_v.weightQ4_0[8192 1024]
-
blk.71.ffn_gate.weightQ4_0[8192 28672]
-
blk.71.attn_k.weightQ4_0[8192 1024]
-
blk.71.attn_output.weightQ4_0[8192 8192]
-
blk.71.attn_q.weightQ4_0[8192 8192]
-
blk.71.attn_v.weightQ4_0[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weightQ4_0[28672 8192]
-
blk.71.ffn_up.weightQ4_0[8192 28672]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weightQ4_0[28672 8192]
-
blk.72.ffn_gate.weightQ4_0[8192 28672]
-
blk.72.ffn_up.weightQ4_0[8192 28672]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.weightQ4_0[8192 1024]
-
blk.72.attn_output.weightQ4_0[8192 8192]
-
blk.72.attn_q.weightQ4_0[8192 8192]
-
blk.72.attn_v.weightQ4_0[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weightQ4_0[28672 8192]
-
blk.73.ffn_gate.weightQ4_0[8192 28672]
-
blk.73.ffn_up.weightQ4_0[8192 28672]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.weightQ4_0[8192 1024]
-
blk.73.attn_output.weightQ4_0[8192 8192]
-
blk.73.attn_q.weightQ4_0[8192 8192]
-
blk.73.attn_v.weightQ4_0[8192 1024]
-
blk.74.attn_k.weightQ4_0[8192 1024]
-
blk.74.attn_output.weightQ4_0[8192 8192]
-
blk.74.attn_q.weightQ4_0[8192 8192]
-
blk.74.attn_v.weightQ4_0[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weightQ4_0[28672 8192]
-
blk.74.ffn_gate.weightQ4_0[8192 28672]
-
blk.74.ffn_up.weightQ4_0[8192 28672]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weightQ4_0[28672 8192]
-
blk.75.ffn_gate.weightQ4_0[8192 28672]
-
blk.75.ffn_up.weightQ4_0[8192 28672]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.attn_k.weightQ4_0[8192 1024]
-
blk.75.attn_output.weightQ4_0[8192 8192]
-
blk.75.attn_q.weightQ4_0[8192 8192]
-
blk.75.attn_v.weightQ4_0[8192 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weightQ4_0[28672 8192]
-
blk.76.ffn_gate.weightQ4_0[8192 28672]
-
blk.76.ffn_up.weightQ4_0[8192 28672]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.weightQ4_0[8192 1024]
-
blk.76.attn_output.weightQ4_0[8192 8192]
-
blk.76.attn_q.weightQ4_0[8192 8192]
-
blk.76.attn_v.weightQ4_0[8192 1024]
-
blk.77.attn_k.weightQ4_0[8192 1024]
-
blk.77.attn_q.weightQ4_0[8192 8192]
-
blk.77.attn_v.weightQ4_0[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weightQ4_0[28672 8192]
-
blk.77.ffn_gate.weightQ4_0[8192 28672]
-
blk.77.ffn_up.weightQ4_0[8192 28672]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_output.weightQ4_0[8192 8192]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weightQ4_0[28672 8192]
-
blk.78.ffn_gate.weightQ4_0[8192 28672]
-
blk.78.ffn_up.weightQ4_0[8192 28672]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_k.weightQ4_0[8192 1024]
-
blk.78.attn_output.weightQ4_0[8192 8192]
-
blk.78.attn_q.weightQ4_0[8192 8192]
-
blk.78.attn_v.weightQ4_0[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weightQ4_0[28672 8192]
-
blk.79.ffn_gate.weightQ4_0[8192 28672]
-
blk.79.ffn_up.weightQ4_0[8192 28672]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.weightQ4_0[8192 1024]
-
blk.79.attn_output.weightQ4_0[8192 8192]
-
blk.79.attn_q.weightQ4_0[8192 8192]
-
blk.79.attn_v.weightQ4_0[8192 1024]
-
output_norm.weightF32[8192]
-
output.weightQ6_K[8192 128256]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79