latest
19GB
34B
524 Pulls Updated 10 months ago
362afdd3a312 · 19GB
-
general.architecturellama
-
general.file_typeQ4_0
-
llama.attention.head_count64
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count48
-
llama.context_length16384
-
llama.embedding_length8192
-
llama.feed_forward_length22016
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_0[8192 32000]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ4_0[22016 8192]
-
blk.0.ffn_gate.weightQ4_0[8192 22016]
-
blk.0.ffn_up.weightQ4_0[8192 22016]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.weightQ4_0[8192 1024]
-
blk.0.attn_output.weightQ4_0[8192 8192]
-
blk.0.attn_q.weightQ4_0[8192 8192]
-
blk.0.attn_v.weightQ4_0[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ4_0[22016 8192]
-
blk.1.ffn_gate.weightQ4_0[8192 22016]
-
blk.1.ffn_up.weightQ4_0[8192 22016]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.weightQ4_0[8192 1024]
-
blk.1.attn_output.weightQ4_0[8192 8192]
-
blk.1.attn_q.weightQ4_0[8192 8192]
-
blk.1.attn_v.weightQ4_0[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ4_0[22016 8192]
-
blk.2.ffn_gate.weightQ4_0[8192 22016]
-
blk.2.ffn_up.weightQ4_0[8192 22016]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.weightQ4_0[8192 1024]
-
blk.2.attn_output.weightQ4_0[8192 8192]
-
blk.2.attn_q.weightQ4_0[8192 8192]
-
blk.2.attn_v.weightQ4_0[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ4_0[22016 8192]
-
blk.3.ffn_gate.weightQ4_0[8192 22016]
-
blk.3.ffn_up.weightQ4_0[8192 22016]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.weightQ4_0[8192 1024]
-
blk.3.attn_output.weightQ4_0[8192 8192]
-
blk.3.attn_q.weightQ4_0[8192 8192]
-
blk.3.attn_v.weightQ4_0[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ4_0[22016 8192]
-
blk.4.ffn_gate.weightQ4_0[8192 22016]
-
blk.4.ffn_up.weightQ4_0[8192 22016]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.weightQ4_0[8192 1024]
-
blk.4.attn_output.weightQ4_0[8192 8192]
-
blk.4.attn_q.weightQ4_0[8192 8192]
-
blk.4.attn_v.weightQ4_0[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ4_0[22016 8192]
-
blk.5.ffn_gate.weightQ4_0[8192 22016]
-
blk.5.ffn_up.weightQ4_0[8192 22016]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.weightQ4_0[8192 1024]
-
blk.5.attn_output.weightQ4_0[8192 8192]
-
blk.5.attn_q.weightQ4_0[8192 8192]
-
blk.5.attn_v.weightQ4_0[8192 1024]
-
blk.6.attn_k.weightQ4_0[8192 1024]
-
blk.6.attn_q.weightQ4_0[8192 8192]
-
blk.6.attn_v.weightQ4_0[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_0[22016 8192]
-
blk.6.ffn_gate.weightQ4_0[8192 22016]
-
blk.6.ffn_up.weightQ4_0[8192 22016]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_output.weightQ4_0[8192 8192]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_0[22016 8192]
-
blk.7.ffn_gate.weightQ4_0[8192 22016]
-
blk.7.ffn_up.weightQ4_0[8192 22016]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.weightQ4_0[8192 1024]
-
blk.7.attn_output.weightQ4_0[8192 8192]
-
blk.7.attn_q.weightQ4_0[8192 8192]
-
blk.7.attn_v.weightQ4_0[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ4_0[22016 8192]
-
blk.8.ffn_gate.weightQ4_0[8192 22016]
-
blk.8.ffn_up.weightQ4_0[8192 22016]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.weightQ4_0[8192 1024]
-
blk.8.attn_output.weightQ4_0[8192 8192]
-
blk.8.attn_q.weightQ4_0[8192 8192]
-
blk.8.attn_v.weightQ4_0[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_0[22016 8192]
-
blk.9.ffn_gate.weightQ4_0[8192 22016]
-
blk.9.ffn_up.weightQ4_0[8192 22016]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.weightQ4_0[8192 1024]
-
blk.9.attn_output.weightQ4_0[8192 8192]
-
blk.9.attn_q.weightQ4_0[8192 8192]
-
blk.9.attn_v.weightQ4_0[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_0[22016 8192]
-
blk.10.ffn_gate.weightQ4_0[8192 22016]
-
blk.10.ffn_up.weightQ4_0[8192 22016]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.weightQ4_0[8192 1024]
-
blk.10.attn_output.weightQ4_0[8192 8192]
-
blk.10.attn_q.weightQ4_0[8192 8192]
-
blk.10.attn_v.weightQ4_0[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_0[22016 8192]
-
blk.11.ffn_gate.weightQ4_0[8192 22016]
-
blk.11.ffn_up.weightQ4_0[8192 22016]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.weightQ4_0[8192 1024]
-
blk.11.attn_output.weightQ4_0[8192 8192]
-
blk.11.attn_q.weightQ4_0[8192 8192]
-
blk.11.attn_v.weightQ4_0[8192 1024]
-
blk.12.ffn_gate.weightQ4_0[8192 22016]
-
blk.12.attn_k.weightQ4_0[8192 1024]
-
blk.12.attn_output.weightQ4_0[8192 8192]
-
blk.12.attn_q.weightQ4_0[8192 8192]
-
blk.12.attn_v.weightQ4_0[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_0[22016 8192]
-
blk.12.ffn_up.weightQ4_0[8192 22016]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_0[22016 8192]
-
blk.13.ffn_gate.weightQ4_0[8192 22016]
-
blk.13.ffn_up.weightQ4_0[8192 22016]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.weightQ4_0[8192 1024]
-
blk.13.attn_output.weightQ4_0[8192 8192]
-
blk.13.attn_q.weightQ4_0[8192 8192]
-
blk.13.attn_v.weightQ4_0[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_0[22016 8192]
-
blk.14.ffn_gate.weightQ4_0[8192 22016]
-
blk.14.ffn_up.weightQ4_0[8192 22016]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.weightQ4_0[8192 1024]
-
blk.14.attn_output.weightQ4_0[8192 8192]
-
blk.14.attn_q.weightQ4_0[8192 8192]
-
blk.14.attn_v.weightQ4_0[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_0[22016 8192]
-
blk.15.ffn_gate.weightQ4_0[8192 22016]
-
blk.15.ffn_up.weightQ4_0[8192 22016]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.weightQ4_0[8192 1024]
-
blk.15.attn_output.weightQ4_0[8192 8192]
-
blk.15.attn_q.weightQ4_0[8192 8192]
-
blk.15.attn_v.weightQ4_0[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_0[22016 8192]
-
blk.16.ffn_gate.weightQ4_0[8192 22016]
-
blk.16.ffn_up.weightQ4_0[8192 22016]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.weightQ4_0[8192 1024]
-
blk.16.attn_output.weightQ4_0[8192 8192]
-
blk.16.attn_q.weightQ4_0[8192 8192]
-
blk.16.attn_v.weightQ4_0[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_0[22016 8192]
-
blk.17.ffn_gate.weightQ4_0[8192 22016]
-
blk.17.ffn_up.weightQ4_0[8192 22016]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.weightQ4_0[8192 1024]
-
blk.17.attn_output.weightQ4_0[8192 8192]
-
blk.17.attn_q.weightQ4_0[8192 8192]
-
blk.17.attn_v.weightQ4_0[8192 1024]
-
blk.18.ffn_gate.weightQ4_0[8192 22016]
-
blk.18.ffn_up.weightQ4_0[8192 22016]
-
blk.18.attn_k.weightQ4_0[8192 1024]
-
blk.18.attn_output.weightQ4_0[8192 8192]
-
blk.18.attn_q.weightQ4_0[8192 8192]
-
blk.18.attn_v.weightQ4_0[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_0[22016 8192]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_0[22016 8192]
-
blk.19.ffn_gate.weightQ4_0[8192 22016]
-
blk.19.ffn_up.weightQ4_0[8192 22016]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.weightQ4_0[8192 1024]
-
blk.19.attn_output.weightQ4_0[8192 8192]
-
blk.19.attn_q.weightQ4_0[8192 8192]
-
blk.19.attn_v.weightQ4_0[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_0[22016 8192]
-
blk.20.ffn_gate.weightQ4_0[8192 22016]
-
blk.20.ffn_up.weightQ4_0[8192 22016]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.weightQ4_0[8192 1024]
-
blk.20.attn_output.weightQ4_0[8192 8192]
-
blk.20.attn_q.weightQ4_0[8192 8192]
-
blk.20.attn_v.weightQ4_0[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_0[22016 8192]
-
blk.21.ffn_gate.weightQ4_0[8192 22016]
-
blk.21.ffn_up.weightQ4_0[8192 22016]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.weightQ4_0[8192 1024]
-
blk.21.attn_output.weightQ4_0[8192 8192]
-
blk.21.attn_q.weightQ4_0[8192 8192]
-
blk.21.attn_v.weightQ4_0[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_0[22016 8192]
-
blk.22.ffn_gate.weightQ4_0[8192 22016]
-
blk.22.ffn_up.weightQ4_0[8192 22016]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.weightQ4_0[8192 1024]
-
blk.22.attn_output.weightQ4_0[8192 8192]
-
blk.22.attn_q.weightQ4_0[8192 8192]
-
blk.22.attn_v.weightQ4_0[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_0[22016 8192]
-
blk.23.ffn_gate.weightQ4_0[8192 22016]
-
blk.23.ffn_up.weightQ4_0[8192 22016]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.weightQ4_0[8192 1024]
-
blk.23.attn_output.weightQ4_0[8192 8192]
-
blk.23.attn_q.weightQ4_0[8192 8192]
-
blk.23.attn_v.weightQ4_0[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_0[22016 8192]
-
blk.24.ffn_gate.weightQ4_0[8192 22016]
-
blk.24.ffn_up.weightQ4_0[8192 22016]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.weightQ4_0[8192 1024]
-
blk.24.attn_output.weightQ4_0[8192 8192]
-
blk.24.attn_q.weightQ4_0[8192 8192]
-
blk.24.attn_v.weightQ4_0[8192 1024]
-
blk.25.attn_k.weightQ4_0[8192 1024]
-
blk.25.attn_output.weightQ4_0[8192 8192]
-
blk.25.attn_q.weightQ4_0[8192 8192]
-
blk.25.attn_v.weightQ4_0[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_0[22016 8192]
-
blk.25.ffn_gate.weightQ4_0[8192 22016]
-
blk.25.ffn_up.weightQ4_0[8192 22016]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_0[22016 8192]
-
blk.26.ffn_gate.weightQ4_0[8192 22016]
-
blk.26.ffn_up.weightQ4_0[8192 22016]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.weightQ4_0[8192 1024]
-
blk.26.attn_output.weightQ4_0[8192 8192]
-
blk.26.attn_q.weightQ4_0[8192 8192]
-
blk.26.attn_v.weightQ4_0[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_0[22016 8192]
-
blk.27.ffn_gate.weightQ4_0[8192 22016]
-
blk.27.ffn_up.weightQ4_0[8192 22016]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.attn_k.weightQ4_0[8192 1024]
-
blk.27.attn_output.weightQ4_0[8192 8192]
-
blk.27.attn_q.weightQ4_0[8192 8192]
-
blk.27.attn_v.weightQ4_0[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_0[22016 8192]
-
blk.28.ffn_gate.weightQ4_0[8192 22016]
-
blk.28.ffn_up.weightQ4_0[8192 22016]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.weightQ4_0[8192 1024]
-
blk.28.attn_output.weightQ4_0[8192 8192]
-
blk.28.attn_q.weightQ4_0[8192 8192]
-
blk.28.attn_v.weightQ4_0[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_0[22016 8192]
-
blk.29.ffn_gate.weightQ4_0[8192 22016]
-
blk.29.ffn_up.weightQ4_0[8192 22016]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.weightQ4_0[8192 1024]
-
blk.29.attn_output.weightQ4_0[8192 8192]
-
blk.29.attn_q.weightQ4_0[8192 8192]
-
blk.29.attn_v.weightQ4_0[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_0[22016 8192]
-
blk.30.ffn_gate.weightQ4_0[8192 22016]
-
blk.30.ffn_up.weightQ4_0[8192 22016]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.weightQ4_0[8192 1024]
-
blk.30.attn_output.weightQ4_0[8192 8192]
-
blk.30.attn_q.weightQ4_0[8192 8192]
-
blk.30.attn_v.weightQ4_0[8192 1024]
-
blk.31.ffn_gate.weightQ4_0[8192 22016]
-
blk.31.attn_k.weightQ4_0[8192 1024]
-
blk.31.attn_output.weightQ4_0[8192 8192]
-
blk.31.attn_q.weightQ4_0[8192 8192]
-
blk.31.attn_v.weightQ4_0[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_0[22016 8192]
-
blk.31.ffn_up.weightQ4_0[8192 22016]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_0[22016 8192]
-
blk.32.ffn_gate.weightQ4_0[8192 22016]
-
blk.32.ffn_up.weightQ4_0[8192 22016]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.weightQ4_0[8192 1024]
-
blk.32.attn_output.weightQ4_0[8192 8192]
-
blk.32.attn_q.weightQ4_0[8192 8192]
-
blk.32.attn_v.weightQ4_0[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_0[22016 8192]
-
blk.33.ffn_gate.weightQ4_0[8192 22016]
-
blk.33.ffn_up.weightQ4_0[8192 22016]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.weightQ4_0[8192 1024]
-
blk.33.attn_output.weightQ4_0[8192 8192]
-
blk.33.attn_q.weightQ4_0[8192 8192]
-
blk.33.attn_v.weightQ4_0[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_0[22016 8192]
-
blk.34.ffn_gate.weightQ4_0[8192 22016]
-
blk.34.ffn_up.weightQ4_0[8192 22016]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.weightQ4_0[8192 1024]
-
blk.34.attn_output.weightQ4_0[8192 8192]
-
blk.34.attn_q.weightQ4_0[8192 8192]
-
blk.34.attn_v.weightQ4_0[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_0[22016 8192]
-
blk.35.ffn_gate.weightQ4_0[8192 22016]
-
blk.35.ffn_up.weightQ4_0[8192 22016]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.weightQ4_0[8192 1024]
-
blk.35.attn_output.weightQ4_0[8192 8192]
-
blk.35.attn_q.weightQ4_0[8192 8192]
-
blk.35.attn_v.weightQ4_0[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_0[22016 8192]
-
blk.36.ffn_gate.weightQ4_0[8192 22016]
-
blk.36.ffn_up.weightQ4_0[8192 22016]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.weightQ4_0[8192 1024]
-
blk.36.attn_output.weightQ4_0[8192 8192]
-
blk.36.attn_q.weightQ4_0[8192 8192]
-
blk.36.attn_v.weightQ4_0[8192 1024]
-
blk.37.ffn_gate.weightQ4_0[8192 22016]
-
blk.37.ffn_up.weightQ4_0[8192 22016]
-
blk.37.attn_k.weightQ4_0[8192 1024]
-
blk.37.attn_output.weightQ4_0[8192 8192]
-
blk.37.attn_q.weightQ4_0[8192 8192]
-
blk.37.attn_v.weightQ4_0[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_0[22016 8192]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_0[22016 8192]
-
blk.38.ffn_gate.weightQ4_0[8192 22016]
-
blk.38.ffn_up.weightQ4_0[8192 22016]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.weightQ4_0[8192 1024]
-
blk.38.attn_output.weightQ4_0[8192 8192]
-
blk.38.attn_q.weightQ4_0[8192 8192]
-
blk.38.attn_v.weightQ4_0[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_0[22016 8192]
-
blk.39.ffn_gate.weightQ4_0[8192 22016]
-
blk.39.ffn_up.weightQ4_0[8192 22016]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.weightQ4_0[8192 1024]
-
blk.39.attn_output.weightQ4_0[8192 8192]
-
blk.39.attn_q.weightQ4_0[8192 8192]
-
blk.39.attn_v.weightQ4_0[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weightQ4_0[22016 8192]
-
blk.40.ffn_gate.weightQ4_0[8192 22016]
-
blk.40.ffn_up.weightQ4_0[8192 22016]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.weightQ4_0[8192 1024]
-
blk.40.attn_output.weightQ4_0[8192 8192]
-
blk.40.attn_q.weightQ4_0[8192 8192]
-
blk.40.attn_v.weightQ4_0[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weightQ4_0[22016 8192]
-
blk.41.ffn_gate.weightQ4_0[8192 22016]
-
blk.41.ffn_up.weightQ4_0[8192 22016]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.weightQ4_0[8192 1024]
-
blk.41.attn_output.weightQ4_0[8192 8192]
-
blk.41.attn_q.weightQ4_0[8192 8192]
-
blk.41.attn_v.weightQ4_0[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weightQ4_0[22016 8192]
-
blk.42.ffn_gate.weightQ4_0[8192 22016]
-
blk.42.ffn_up.weightQ4_0[8192 22016]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.weightQ4_0[8192 1024]
-
blk.42.attn_output.weightQ4_0[8192 8192]
-
blk.42.attn_q.weightQ4_0[8192 8192]
-
blk.42.attn_v.weightQ4_0[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weightQ4_0[22016 8192]
-
blk.43.ffn_gate.weightQ4_0[8192 22016]
-
blk.43.ffn_up.weightQ4_0[8192 22016]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.weightQ4_0[8192 1024]
-
blk.43.attn_output.weightQ4_0[8192 8192]
-
blk.43.attn_q.weightQ4_0[8192 8192]
-
blk.43.attn_v.weightQ4_0[8192 1024]
-
blk.44.attn_k.weightQ4_0[8192 1024]
-
blk.44.attn_output.weightQ4_0[8192 8192]
-
blk.44.attn_q.weightQ4_0[8192 8192]
-
blk.44.attn_v.weightQ4_0[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weightQ4_0[22016 8192]
-
blk.44.ffn_gate.weightQ4_0[8192 22016]
-
blk.44.ffn_up.weightQ4_0[8192 22016]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weightQ4_0[22016 8192]
-
blk.45.ffn_gate.weightQ4_0[8192 22016]
-
blk.45.ffn_up.weightQ4_0[8192 22016]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.weightQ4_0[8192 1024]
-
blk.45.attn_output.weightQ4_0[8192 8192]
-
blk.45.attn_q.weightQ4_0[8192 8192]
-
blk.45.attn_v.weightQ4_0[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weightQ4_0[22016 8192]
-
blk.46.ffn_gate.weightQ4_0[8192 22016]
-
blk.46.ffn_up.weightQ4_0[8192 22016]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.weightQ4_0[8192 1024]
-
blk.46.attn_output.weightQ4_0[8192 8192]
-
blk.46.attn_q.weightQ4_0[8192 8192]
-
blk.46.attn_v.weightQ4_0[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weightQ4_0[22016 8192]
-
blk.47.ffn_gate.weightQ4_0[8192 22016]
-
blk.47.ffn_up.weightQ4_0[8192 22016]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.weightQ4_0[8192 1024]
-
blk.47.attn_output.weightQ4_0[8192 8192]
-
blk.47.attn_q.weightQ4_0[8192 8192]
-
blk.47.attn_v.weightQ4_0[8192 1024]
-
output.weightQ6_K[8192 32000]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47