latest
9.9GB
imatrix quants of deepseek-coder
33B
38 Pulls Updated 6 months ago
175fb8c0ac4c · 13GB
-
general.architecturellama
-
general.file_typeIQ3_XXS
-
llama.attention.head_count56
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count62
-
llama.context_length16384
-
llama.embedding_length7168
-
llama.feed_forward_length19200
-
llama.rope.dimension_count128
-
llama.rope.freq_base100000
-
llama.rope.scaling.factor4
-
llama.rope.scaling.typelinear
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id32013
-
tokenizer.ggml.eos_token_id32021
-
tokenizer.ggml.merges[Ġ Ġ Ġ t Ġ a i n h e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id32014
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ4_K[7168 32256]
-
blk.0.attn_q.weightI32[7168 7168]
-
blk.0.attn_k.weightI32[7168 1024]
-
blk.0.attn_v.weightQ4_K[7168 1024]
-
blk.0.attn_output.weightQ3_K[7168 7168]
-
blk.0.ffn_gate.weightI32[7168 19200]
-
blk.0.ffn_up.weightI32[7168 19200]
-
blk.0.ffn_down.weightI32[19200 7168]
-
blk.0.attn_norm.weightF32[7168]
-
blk.0.ffn_norm.weightF32[7168]
-
blk.1.attn_q.weightI32[7168 7168]
-
blk.1.attn_k.weightI32[7168 1024]
-
blk.1.attn_v.weightQ4_K[7168 1024]
-
blk.1.attn_output.weightQ3_K[7168 7168]
-
blk.1.ffn_gate.weightI32[7168 19200]
-
blk.1.ffn_up.weightI32[7168 19200]
-
blk.1.ffn_down.weightI32[19200 7168]
-
blk.1.attn_norm.weightF32[7168]
-
blk.1.ffn_norm.weightF32[7168]
-
blk.2.attn_q.weightI32[7168 7168]
-
blk.2.attn_k.weightI32[7168 1024]
-
blk.2.attn_v.weightQ4_K[7168 1024]
-
blk.2.attn_output.weightQ3_K[7168 7168]
-
blk.2.ffn_gate.weightI32[7168 19200]
-
blk.2.ffn_up.weightI32[7168 19200]
-
blk.2.ffn_down.weightI32[19200 7168]
-
blk.2.attn_norm.weightF32[7168]
-
blk.2.ffn_norm.weightF32[7168]
-
blk.3.attn_q.weightI32[7168 7168]
-
blk.3.attn_k.weightI32[7168 1024]
-
blk.3.attn_v.weightQ4_K[7168 1024]
-
blk.3.attn_output.weightQ3_K[7168 7168]
-
blk.3.ffn_gate.weightI32[7168 19200]
-
blk.3.ffn_up.weightI32[7168 19200]
-
blk.3.ffn_down.weightI32[19200 7168]
-
blk.3.attn_norm.weightF32[7168]
-
blk.3.ffn_norm.weightF32[7168]
-
blk.4.attn_q.weightI32[7168 7168]
-
blk.4.attn_k.weightI32[7168 1024]
-
blk.4.attn_v.weightQ4_K[7168 1024]
-
blk.4.attn_output.weightQ3_K[7168 7168]
-
blk.4.ffn_gate.weightI32[7168 19200]
-
blk.4.ffn_up.weightI32[7168 19200]
-
blk.4.ffn_down.weightI32[19200 7168]
-
blk.4.attn_norm.weightF32[7168]
-
blk.4.ffn_norm.weightF32[7168]
-
blk.5.attn_q.weightI32[7168 7168]
-
blk.5.attn_k.weightI32[7168 1024]
-
blk.5.attn_v.weightQ4_K[7168 1024]
-
blk.5.attn_output.weightQ3_K[7168 7168]
-
blk.5.ffn_gate.weightI32[7168 19200]
-
blk.5.ffn_up.weightI32[7168 19200]
-
blk.5.ffn_down.weightI32[19200 7168]
-
blk.5.attn_norm.weightF32[7168]
-
blk.5.ffn_norm.weightF32[7168]
-
blk.6.attn_q.weightI32[7168 7168]
-
blk.6.attn_k.weightI32[7168 1024]
-
blk.6.attn_v.weightQ4_K[7168 1024]
-
blk.6.attn_output.weightQ3_K[7168 7168]
-
blk.6.ffn_gate.weightI32[7168 19200]
-
blk.6.ffn_up.weightI32[7168 19200]
-
blk.6.ffn_down.weightI32[19200 7168]
-
blk.6.attn_norm.weightF32[7168]
-
blk.6.ffn_norm.weightF32[7168]
-
blk.7.attn_q.weightI32[7168 7168]
-
blk.7.attn_k.weightI32[7168 1024]
-
blk.7.attn_v.weightQ4_K[7168 1024]
-
blk.7.attn_output.weightQ3_K[7168 7168]
-
blk.7.ffn_gate.weightI32[7168 19200]
-
blk.7.ffn_up.weightI32[7168 19200]
-
blk.7.ffn_down.weightI32[19200 7168]
-
blk.7.attn_norm.weightF32[7168]
-
blk.7.ffn_norm.weightF32[7168]
-
blk.8.attn_q.weightI32[7168 7168]
-
blk.8.attn_k.weightI32[7168 1024]
-
blk.8.attn_v.weightQ4_K[7168 1024]
-
blk.8.attn_output.weightQ3_K[7168 7168]
-
blk.8.ffn_gate.weightI32[7168 19200]
-
blk.8.ffn_up.weightI32[7168 19200]
-
blk.8.ffn_down.weightI32[19200 7168]
-
blk.8.attn_norm.weightF32[7168]
-
blk.8.ffn_norm.weightF32[7168]
-
blk.9.attn_q.weightI32[7168 7168]
-
blk.9.attn_k.weightI32[7168 1024]
-
blk.9.attn_v.weightQ4_K[7168 1024]
-
blk.9.attn_output.weightQ3_K[7168 7168]
-
blk.9.ffn_gate.weightI32[7168 19200]
-
blk.9.ffn_up.weightI32[7168 19200]
-
blk.9.ffn_down.weightI32[19200 7168]
-
blk.9.attn_norm.weightF32[7168]
-
blk.9.ffn_norm.weightF32[7168]
-
blk.10.attn_q.weightI32[7168 7168]
-
blk.10.attn_k.weightI32[7168 1024]
-
blk.10.attn_v.weightQ4_K[7168 1024]
-
blk.10.attn_output.weightQ3_K[7168 7168]
-
blk.10.ffn_gate.weightI32[7168 19200]
-
blk.10.ffn_up.weightI32[7168 19200]
-
blk.10.ffn_down.weightI32[19200 7168]
-
blk.10.attn_norm.weightF32[7168]
-
blk.10.ffn_norm.weightF32[7168]
-
blk.11.attn_q.weightI32[7168 7168]
-
blk.11.attn_k.weightI32[7168 1024]
-
blk.11.attn_v.weightQ4_K[7168 1024]
-
blk.11.attn_output.weightQ3_K[7168 7168]
-
blk.11.ffn_gate.weightI32[7168 19200]
-
blk.11.ffn_up.weightI32[7168 19200]
-
blk.11.ffn_down.weightI32[19200 7168]
-
blk.11.attn_norm.weightF32[7168]
-
blk.11.ffn_norm.weightF32[7168]
-
blk.12.attn_q.weightI32[7168 7168]
-
blk.12.attn_k.weightI32[7168 1024]
-
blk.12.attn_v.weightQ4_K[7168 1024]
-
blk.12.attn_output.weightQ3_K[7168 7168]
-
blk.12.ffn_gate.weightI32[7168 19200]
-
blk.12.ffn_up.weightI32[7168 19200]
-
blk.12.ffn_down.weightI32[19200 7168]
-
blk.12.attn_norm.weightF32[7168]
-
blk.12.ffn_norm.weightF32[7168]
-
blk.13.attn_q.weightI32[7168 7168]
-
blk.13.attn_k.weightI32[7168 1024]
-
blk.13.attn_v.weightQ4_K[7168 1024]
-
blk.13.attn_output.weightQ3_K[7168 7168]
-
blk.13.ffn_gate.weightI32[7168 19200]
-
blk.13.ffn_up.weightI32[7168 19200]
-
blk.13.ffn_down.weightI32[19200 7168]
-
blk.13.attn_norm.weightF32[7168]
-
blk.13.ffn_norm.weightF32[7168]
-
blk.14.attn_q.weightI32[7168 7168]
-
blk.14.attn_k.weightI32[7168 1024]
-
blk.14.attn_v.weightQ4_K[7168 1024]
-
blk.14.attn_output.weightQ3_K[7168 7168]
-
blk.14.ffn_gate.weightI32[7168 19200]
-
blk.14.ffn_up.weightI32[7168 19200]
-
blk.14.ffn_down.weightI32[19200 7168]
-
blk.14.attn_norm.weightF32[7168]
-
blk.14.ffn_norm.weightF32[7168]
-
blk.15.attn_q.weightI32[7168 7168]
-
blk.15.attn_k.weightI32[7168 1024]
-
blk.15.attn_v.weightQ4_K[7168 1024]
-
blk.15.attn_output.weightQ3_K[7168 7168]
-
blk.15.ffn_gate.weightI32[7168 19200]
-
blk.15.ffn_up.weightI32[7168 19200]
-
blk.15.ffn_down.weightI32[19200 7168]
-
blk.15.attn_norm.weightF32[7168]
-
blk.15.ffn_norm.weightF32[7168]
-
blk.16.attn_q.weightI32[7168 7168]
-
blk.16.attn_k.weightI32[7168 1024]
-
blk.16.attn_v.weightQ4_K[7168 1024]
-
blk.16.attn_output.weightQ3_K[7168 7168]
-
blk.16.ffn_gate.weightI32[7168 19200]
-
blk.16.ffn_up.weightI32[7168 19200]
-
blk.16.ffn_down.weightI32[19200 7168]
-
blk.16.attn_norm.weightF32[7168]
-
blk.16.ffn_norm.weightF32[7168]
-
blk.17.attn_q.weightI32[7168 7168]
-
blk.17.attn_k.weightI32[7168 1024]
-
blk.17.attn_v.weightQ4_K[7168 1024]
-
blk.17.attn_output.weightQ3_K[7168 7168]
-
blk.17.ffn_gate.weightI32[7168 19200]
-
blk.17.ffn_up.weightI32[7168 19200]
-
blk.17.ffn_down.weightI32[19200 7168]
-
blk.17.attn_norm.weightF32[7168]
-
blk.17.ffn_norm.weightF32[7168]
-
blk.18.attn_q.weightI32[7168 7168]
-
blk.18.attn_k.weightI32[7168 1024]
-
blk.18.attn_v.weightQ4_K[7168 1024]
-
blk.18.attn_output.weightQ3_K[7168 7168]
-
blk.18.ffn_gate.weightI32[7168 19200]
-
blk.18.ffn_up.weightI32[7168 19200]
-
blk.18.ffn_down.weightI32[19200 7168]
-
blk.18.attn_norm.weightF32[7168]
-
blk.18.ffn_norm.weightF32[7168]
-
blk.19.attn_q.weightI32[7168 7168]
-
blk.19.attn_k.weightI32[7168 1024]
-
blk.19.attn_v.weightQ4_K[7168 1024]
-
blk.19.attn_output.weightQ3_K[7168 7168]
-
blk.19.ffn_gate.weightI32[7168 19200]
-
blk.19.ffn_up.weightI32[7168 19200]
-
blk.19.ffn_down.weightI32[19200 7168]
-
blk.19.attn_norm.weightF32[7168]
-
blk.19.ffn_norm.weightF32[7168]
-
blk.20.attn_q.weightI32[7168 7168]
-
blk.20.attn_k.weightI32[7168 1024]
-
blk.20.attn_v.weightQ4_K[7168 1024]
-
blk.20.attn_output.weightQ3_K[7168 7168]
-
blk.20.ffn_gate.weightI32[7168 19200]
-
blk.20.ffn_up.weightI32[7168 19200]
-
blk.20.ffn_down.weightI32[19200 7168]
-
blk.20.attn_norm.weightF32[7168]
-
blk.20.ffn_norm.weightF32[7168]
-
blk.21.attn_q.weightI32[7168 7168]
-
blk.21.attn_k.weightI32[7168 1024]
-
blk.21.attn_v.weightQ4_K[7168 1024]
-
blk.21.attn_output.weightQ3_K[7168 7168]
-
blk.21.ffn_gate.weightI32[7168 19200]
-
blk.21.ffn_up.weightI32[7168 19200]
-
blk.21.ffn_down.weightI32[19200 7168]
-
blk.21.attn_norm.weightF32[7168]
-
blk.21.ffn_norm.weightF32[7168]
-
blk.22.attn_q.weightI32[7168 7168]
-
blk.22.attn_k.weightI32[7168 1024]
-
blk.22.attn_v.weightQ4_K[7168 1024]
-
blk.22.attn_output.weightQ3_K[7168 7168]
-
blk.22.ffn_gate.weightI32[7168 19200]
-
blk.22.ffn_up.weightI32[7168 19200]
-
blk.22.ffn_down.weightI32[19200 7168]
-
blk.22.attn_norm.weightF32[7168]
-
blk.22.ffn_norm.weightF32[7168]
-
blk.23.attn_q.weightI32[7168 7168]
-
blk.23.attn_k.weightI32[7168 1024]
-
blk.23.attn_v.weightQ4_K[7168 1024]
-
blk.23.attn_output.weightQ3_K[7168 7168]
-
blk.23.ffn_gate.weightI32[7168 19200]
-
blk.23.ffn_up.weightI32[7168 19200]
-
blk.23.ffn_down.weightI32[19200 7168]
-
blk.23.attn_norm.weightF32[7168]
-
blk.23.ffn_norm.weightF32[7168]
-
blk.24.attn_q.weightI32[7168 7168]
-
blk.24.attn_k.weightI32[7168 1024]
-
blk.24.attn_v.weightQ4_K[7168 1024]
-
blk.24.attn_output.weightQ3_K[7168 7168]
-
blk.24.ffn_gate.weightI32[7168 19200]
-
blk.24.ffn_up.weightI32[7168 19200]
-
blk.24.ffn_down.weightI32[19200 7168]
-
blk.24.attn_norm.weightF32[7168]
-
blk.24.ffn_norm.weightF32[7168]
-
blk.25.attn_q.weightI32[7168 7168]
-
blk.25.attn_k.weightI32[7168 1024]
-
blk.25.attn_v.weightQ4_K[7168 1024]
-
blk.25.attn_output.weightQ3_K[7168 7168]
-
blk.25.ffn_gate.weightI32[7168 19200]
-
blk.25.ffn_up.weightI32[7168 19200]
-
blk.25.ffn_down.weightI32[19200 7168]
-
blk.25.attn_norm.weightF32[7168]
-
blk.25.ffn_norm.weightF32[7168]
-
blk.26.attn_q.weightI32[7168 7168]
-
blk.26.attn_k.weightI32[7168 1024]
-
blk.26.attn_v.weightQ4_K[7168 1024]
-
blk.26.attn_output.weightQ3_K[7168 7168]
-
blk.26.ffn_gate.weightI32[7168 19200]
-
blk.26.ffn_up.weightI32[7168 19200]
-
blk.26.ffn_down.weightI32[19200 7168]
-
blk.26.attn_norm.weightF32[7168]
-
blk.26.ffn_norm.weightF32[7168]
-
blk.27.attn_q.weightI32[7168 7168]
-
blk.27.attn_k.weightI32[7168 1024]
-
blk.27.attn_v.weightQ4_K[7168 1024]
-
blk.27.attn_output.weightQ3_K[7168 7168]
-
blk.27.ffn_gate.weightI32[7168 19200]
-
blk.27.ffn_up.weightI32[7168 19200]
-
blk.27.ffn_down.weightI32[19200 7168]
-
blk.27.attn_norm.weightF32[7168]
-
blk.27.ffn_norm.weightF32[7168]
-
blk.28.attn_q.weightI32[7168 7168]
-
blk.28.attn_k.weightI32[7168 1024]
-
blk.28.attn_v.weightQ4_K[7168 1024]
-
blk.28.attn_output.weightQ3_K[7168 7168]
-
blk.28.ffn_gate.weightI32[7168 19200]
-
blk.28.ffn_up.weightI32[7168 19200]
-
blk.28.ffn_down.weightI32[19200 7168]
-
blk.28.attn_norm.weightF32[7168]
-
blk.28.ffn_norm.weightF32[7168]
-
blk.29.attn_q.weightI32[7168 7168]
-
blk.29.attn_k.weightI32[7168 1024]
-
blk.29.attn_v.weightQ4_K[7168 1024]
-
blk.29.attn_output.weightQ3_K[7168 7168]
-
blk.29.ffn_gate.weightI32[7168 19200]
-
blk.29.ffn_up.weightI32[7168 19200]
-
blk.29.ffn_down.weightI32[19200 7168]
-
blk.29.attn_norm.weightF32[7168]
-
blk.29.ffn_norm.weightF32[7168]
-
blk.30.attn_q.weightI32[7168 7168]
-
blk.30.attn_k.weightI32[7168 1024]
-
blk.30.attn_v.weightQ4_K[7168 1024]
-
blk.30.attn_output.weightQ3_K[7168 7168]
-
blk.30.ffn_gate.weightI32[7168 19200]
-
blk.30.ffn_up.weightI32[7168 19200]
-
blk.30.ffn_down.weightI32[19200 7168]
-
blk.30.attn_norm.weightF32[7168]
-
blk.30.ffn_norm.weightF32[7168]
-
blk.31.attn_q.weightI32[7168 7168]
-
blk.31.attn_k.weightI32[7168 1024]
-
blk.31.attn_v.weightQ4_K[7168 1024]
-
blk.31.attn_output.weightQ3_K[7168 7168]
-
blk.31.ffn_gate.weightI32[7168 19200]
-
blk.31.ffn_up.weightI32[7168 19200]
-
blk.31.ffn_down.weightI32[19200 7168]
-
blk.31.attn_norm.weightF32[7168]
-
blk.31.ffn_norm.weightF32[7168]
-
blk.32.attn_q.weightI32[7168 7168]
-
blk.32.attn_k.weightI32[7168 1024]
-
blk.32.attn_v.weightQ4_K[7168 1024]
-
blk.32.attn_output.weightQ3_K[7168 7168]
-
blk.32.ffn_gate.weightI32[7168 19200]
-
blk.32.ffn_up.weightI32[7168 19200]
-
blk.32.ffn_down.weightI32[19200 7168]
-
blk.32.attn_norm.weightF32[7168]
-
blk.32.ffn_norm.weightF32[7168]
-
blk.33.attn_q.weightI32[7168 7168]
-
blk.33.attn_k.weightI32[7168 1024]
-
blk.33.attn_v.weightQ4_K[7168 1024]
-
blk.33.attn_output.weightQ3_K[7168 7168]
-
blk.33.ffn_gate.weightI32[7168 19200]
-
blk.33.ffn_up.weightI32[7168 19200]
-
blk.33.ffn_down.weightI32[19200 7168]
-
blk.33.attn_norm.weightF32[7168]
-
blk.33.ffn_norm.weightF32[7168]
-
blk.34.attn_q.weightI32[7168 7168]
-
blk.34.attn_k.weightI32[7168 1024]
-
blk.34.attn_v.weightQ4_K[7168 1024]
-
blk.34.attn_output.weightQ3_K[7168 7168]
-
blk.34.ffn_gate.weightI32[7168 19200]
-
blk.34.ffn_up.weightI32[7168 19200]
-
blk.34.ffn_down.weightI32[19200 7168]
-
blk.34.attn_norm.weightF32[7168]
-
blk.34.ffn_norm.weightF32[7168]
-
blk.35.attn_q.weightI32[7168 7168]
-
blk.35.attn_k.weightI32[7168 1024]
-
blk.35.attn_v.weightQ4_K[7168 1024]
-
blk.35.attn_output.weightQ3_K[7168 7168]
-
blk.35.ffn_gate.weightI32[7168 19200]
-
blk.35.ffn_up.weightI32[7168 19200]
-
blk.35.ffn_down.weightI32[19200 7168]
-
blk.35.attn_norm.weightF32[7168]
-
blk.35.ffn_norm.weightF32[7168]
-
blk.36.attn_q.weightI32[7168 7168]
-
blk.36.attn_k.weightI32[7168 1024]
-
blk.36.attn_v.weightQ4_K[7168 1024]
-
blk.36.attn_output.weightQ3_K[7168 7168]
-
blk.36.ffn_gate.weightI32[7168 19200]
-
blk.36.ffn_up.weightI32[7168 19200]
-
blk.36.ffn_down.weightI32[19200 7168]
-
blk.36.attn_norm.weightF32[7168]
-
blk.36.ffn_norm.weightF32[7168]
-
blk.37.attn_q.weightI32[7168 7168]
-
blk.37.attn_k.weightI32[7168 1024]
-
blk.37.attn_v.weightQ4_K[7168 1024]
-
blk.37.attn_output.weightQ3_K[7168 7168]
-
blk.37.ffn_gate.weightI32[7168 19200]
-
blk.37.ffn_up.weightI32[7168 19200]
-
blk.37.ffn_down.weightI32[19200 7168]
-
blk.37.attn_norm.weightF32[7168]
-
blk.37.ffn_norm.weightF32[7168]
-
blk.38.attn_q.weightI32[7168 7168]
-
blk.38.attn_k.weightI32[7168 1024]
-
blk.38.attn_v.weightQ4_K[7168 1024]
-
blk.38.attn_output.weightQ3_K[7168 7168]
-
blk.38.ffn_gate.weightI32[7168 19200]
-
blk.38.ffn_up.weightI32[7168 19200]
-
blk.38.ffn_down.weightI32[19200 7168]
-
blk.38.attn_norm.weightF32[7168]
-
blk.38.ffn_norm.weightF32[7168]
-
blk.39.attn_q.weightI32[7168 7168]
-
blk.39.attn_k.weightI32[7168 1024]
-
blk.39.attn_v.weightQ4_K[7168 1024]
-
blk.39.attn_output.weightQ3_K[7168 7168]
-
blk.39.ffn_gate.weightI32[7168 19200]
-
blk.39.ffn_up.weightI32[7168 19200]
-
blk.39.ffn_down.weightI32[19200 7168]
-
blk.39.attn_norm.weightF32[7168]
-
blk.39.ffn_norm.weightF32[7168]
-
blk.40.attn_q.weightI32[7168 7168]
-
blk.40.attn_k.weightI32[7168 1024]
-
blk.40.attn_v.weightQ4_K[7168 1024]
-
blk.40.attn_output.weightQ3_K[7168 7168]
-
blk.40.ffn_gate.weightI32[7168 19200]
-
blk.40.ffn_up.weightI32[7168 19200]
-
blk.40.ffn_down.weightI32[19200 7168]
-
blk.40.attn_norm.weightF32[7168]
-
blk.40.ffn_norm.weightF32[7168]
-
blk.41.attn_q.weightI32[7168 7168]
-
blk.41.attn_k.weightI32[7168 1024]
-
blk.41.attn_v.weightQ4_K[7168 1024]
-
blk.41.attn_output.weightQ3_K[7168 7168]
-
blk.41.ffn_gate.weightI32[7168 19200]
-
blk.41.ffn_up.weightI32[7168 19200]
-
blk.41.ffn_down.weightI32[19200 7168]
-
blk.41.attn_norm.weightF32[7168]
-
blk.41.ffn_norm.weightF32[7168]
-
blk.42.attn_q.weightI32[7168 7168]
-
blk.42.attn_k.weightI32[7168 1024]
-
blk.42.attn_v.weightQ4_K[7168 1024]
-
blk.42.attn_output.weightQ3_K[7168 7168]
-
blk.42.ffn_gate.weightI32[7168 19200]
-
blk.42.ffn_up.weightI32[7168 19200]
-
blk.42.ffn_down.weightI32[19200 7168]
-
blk.42.attn_norm.weightF32[7168]
-
blk.42.ffn_norm.weightF32[7168]
-
blk.43.attn_q.weightI32[7168 7168]
-
blk.43.attn_k.weightI32[7168 1024]
-
blk.43.attn_v.weightQ4_K[7168 1024]
-
blk.43.attn_output.weightQ3_K[7168 7168]
-
blk.43.ffn_gate.weightI32[7168 19200]
-
blk.43.ffn_up.weightI32[7168 19200]
-
blk.43.ffn_down.weightI32[19200 7168]
-
blk.43.attn_norm.weightF32[7168]
-
blk.43.ffn_norm.weightF32[7168]
-
blk.44.attn_q.weightI32[7168 7168]
-
blk.44.attn_k.weightI32[7168 1024]
-
blk.44.attn_v.weightQ4_K[7168 1024]
-
blk.44.attn_output.weightQ3_K[7168 7168]
-
blk.44.ffn_gate.weightI32[7168 19200]
-
blk.44.ffn_up.weightI32[7168 19200]
-
blk.44.ffn_down.weightI32[19200 7168]
-
blk.44.attn_norm.weightF32[7168]
-
blk.44.ffn_norm.weightF32[7168]
-
blk.45.attn_q.weightI32[7168 7168]
-
blk.45.attn_k.weightI32[7168 1024]
-
blk.45.attn_v.weightQ4_K[7168 1024]
-
blk.45.attn_output.weightQ3_K[7168 7168]
-
blk.45.ffn_gate.weightI32[7168 19200]
-
blk.45.ffn_up.weightI32[7168 19200]
-
blk.45.ffn_down.weightI32[19200 7168]
-
blk.45.attn_norm.weightF32[7168]
-
blk.45.ffn_norm.weightF32[7168]
-
blk.46.attn_q.weightI32[7168 7168]
-
blk.46.attn_k.weightI32[7168 1024]
-
blk.46.attn_v.weightQ4_K[7168 1024]
-
blk.46.attn_output.weightQ3_K[7168 7168]
-
blk.46.ffn_gate.weightI32[7168 19200]
-
blk.46.ffn_up.weightI32[7168 19200]
-
blk.46.ffn_down.weightI32[19200 7168]
-
blk.46.attn_norm.weightF32[7168]
-
blk.46.ffn_norm.weightF32[7168]
-
blk.47.attn_q.weightI32[7168 7168]
-
blk.47.attn_k.weightI32[7168 1024]
-
blk.47.attn_v.weightQ4_K[7168 1024]
-
blk.47.attn_output.weightQ3_K[7168 7168]
-
blk.47.ffn_gate.weightI32[7168 19200]
-
blk.47.ffn_up.weightI32[7168 19200]
-
blk.47.ffn_down.weightI32[19200 7168]
-
blk.47.attn_norm.weightF32[7168]
-
blk.47.ffn_norm.weightF32[7168]
-
blk.48.attn_q.weightI32[7168 7168]
-
blk.48.attn_k.weightI32[7168 1024]
-
blk.48.attn_v.weightQ4_K[7168 1024]
-
blk.48.attn_output.weightQ3_K[7168 7168]
-
blk.48.ffn_gate.weightI32[7168 19200]
-
blk.48.ffn_up.weightI32[7168 19200]
-
blk.48.ffn_down.weightI32[19200 7168]
-
blk.48.attn_norm.weightF32[7168]
-
blk.48.ffn_norm.weightF32[7168]
-
blk.49.attn_q.weightI32[7168 7168]
-
blk.49.attn_k.weightI32[7168 1024]
-
blk.49.attn_v.weightQ4_K[7168 1024]
-
blk.49.attn_output.weightQ3_K[7168 7168]
-
blk.49.ffn_gate.weightI32[7168 19200]
-
blk.49.ffn_up.weightI32[7168 19200]
-
blk.49.ffn_down.weightI32[19200 7168]
-
blk.49.attn_norm.weightF32[7168]
-
blk.49.ffn_norm.weightF32[7168]
-
blk.50.attn_q.weightI32[7168 7168]
-
blk.50.attn_k.weightI32[7168 1024]
-
blk.50.attn_v.weightQ4_K[7168 1024]
-
blk.50.attn_output.weightQ3_K[7168 7168]
-
blk.50.ffn_gate.weightI32[7168 19200]
-
blk.50.ffn_up.weightI32[7168 19200]
-
blk.50.ffn_down.weightI32[19200 7168]
-
blk.50.attn_norm.weightF32[7168]
-
blk.50.ffn_norm.weightF32[7168]
-
blk.51.attn_q.weightI32[7168 7168]
-
blk.51.attn_k.weightI32[7168 1024]
-
blk.51.attn_v.weightQ4_K[7168 1024]
-
blk.51.attn_output.weightQ3_K[7168 7168]
-
blk.51.ffn_gate.weightI32[7168 19200]
-
blk.51.ffn_up.weightI32[7168 19200]
-
blk.51.ffn_down.weightI32[19200 7168]
-
blk.51.attn_norm.weightF32[7168]
-
blk.51.ffn_norm.weightF32[7168]
-
blk.52.attn_q.weightI32[7168 7168]
-
blk.52.attn_k.weightI32[7168 1024]
-
blk.52.attn_v.weightQ4_K[7168 1024]
-
blk.52.attn_output.weightQ3_K[7168 7168]
-
blk.52.ffn_gate.weightI32[7168 19200]
-
blk.52.ffn_up.weightI32[7168 19200]
-
blk.52.ffn_down.weightI32[19200 7168]
-
blk.52.attn_norm.weightF32[7168]
-
blk.52.ffn_norm.weightF32[7168]
-
blk.53.attn_q.weightI32[7168 7168]
-
blk.53.attn_k.weightI32[7168 1024]
-
blk.53.attn_v.weightQ4_K[7168 1024]
-
blk.53.attn_output.weightQ3_K[7168 7168]
-
blk.53.ffn_gate.weightI32[7168 19200]
-
blk.53.ffn_up.weightI32[7168 19200]
-
blk.53.ffn_down.weightI32[19200 7168]
-
blk.53.attn_norm.weightF32[7168]
-
blk.53.ffn_norm.weightF32[7168]
-
blk.54.attn_q.weightI32[7168 7168]
-
blk.54.attn_k.weightI32[7168 1024]
-
blk.54.attn_v.weightQ4_K[7168 1024]
-
blk.54.attn_output.weightQ3_K[7168 7168]
-
blk.54.ffn_gate.weightI32[7168 19200]
-
blk.54.ffn_up.weightI32[7168 19200]
-
blk.54.ffn_down.weightI32[19200 7168]
-
blk.54.attn_norm.weightF32[7168]
-
blk.54.ffn_norm.weightF32[7168]
-
blk.55.attn_q.weightI32[7168 7168]
-
blk.55.attn_k.weightI32[7168 1024]
-
blk.55.attn_v.weightQ4_K[7168 1024]
-
blk.55.attn_output.weightQ3_K[7168 7168]
-
blk.55.ffn_gate.weightI32[7168 19200]
-
blk.55.ffn_up.weightI32[7168 19200]
-
blk.55.ffn_down.weightI32[19200 7168]
-
blk.55.attn_norm.weightF32[7168]
-
blk.55.ffn_norm.weightF32[7168]
-
blk.56.attn_q.weightI32[7168 7168]
-
blk.56.attn_k.weightI32[7168 1024]
-
blk.56.attn_v.weightQ4_K[7168 1024]
-
blk.56.attn_output.weightQ3_K[7168 7168]
-
blk.56.ffn_gate.weightI32[7168 19200]
-
blk.56.ffn_up.weightI32[7168 19200]
-
blk.56.ffn_down.weightI32[19200 7168]
-
blk.56.attn_norm.weightF32[7168]
-
blk.56.ffn_norm.weightF32[7168]
-
blk.57.attn_q.weightI32[7168 7168]
-
blk.57.attn_k.weightI32[7168 1024]
-
blk.57.attn_v.weightQ4_K[7168 1024]
-
blk.57.attn_output.weightQ3_K[7168 7168]
-
blk.57.ffn_gate.weightI32[7168 19200]
-
blk.57.ffn_up.weightI32[7168 19200]
-
blk.57.ffn_down.weightI32[19200 7168]
-
blk.57.attn_norm.weightF32[7168]
-
blk.57.ffn_norm.weightF32[7168]
-
blk.58.attn_q.weightI32[7168 7168]
-
blk.58.attn_k.weightI32[7168 1024]
-
blk.58.attn_v.weightQ4_K[7168 1024]
-
blk.58.attn_output.weightQ3_K[7168 7168]
-
blk.58.ffn_gate.weightI32[7168 19200]
-
blk.58.ffn_up.weightI32[7168 19200]
-
blk.58.ffn_down.weightI32[19200 7168]
-
blk.58.attn_norm.weightF32[7168]
-
blk.58.ffn_norm.weightF32[7168]
-
blk.59.attn_q.weightI32[7168 7168]
-
blk.59.attn_k.weightI32[7168 1024]
-
blk.59.attn_v.weightQ4_K[7168 1024]
-
blk.59.attn_output.weightQ3_K[7168 7168]
-
blk.59.ffn_gate.weightI32[7168 19200]
-
blk.59.ffn_up.weightI32[7168 19200]
-
blk.59.ffn_down.weightI32[19200 7168]
-
blk.59.attn_norm.weightF32[7168]
-
blk.59.ffn_norm.weightF32[7168]
-
blk.60.attn_q.weightI32[7168 7168]
-
blk.60.attn_k.weightI32[7168 1024]
-
blk.60.attn_v.weightQ4_K[7168 1024]
-
blk.60.attn_output.weightQ3_K[7168 7168]
-
blk.60.ffn_gate.weightI32[7168 19200]
-
blk.60.ffn_up.weightI32[7168 19200]
-
blk.60.ffn_down.weightI32[19200 7168]
-
blk.60.attn_norm.weightF32[7168]
-
blk.60.ffn_norm.weightF32[7168]
-
blk.61.attn_q.weightI32[7168 7168]
-
blk.61.attn_k.weightI32[7168 1024]
-
blk.61.attn_v.weightQ4_K[7168 1024]
-
blk.61.attn_output.weightQ3_K[7168 7168]
-
blk.61.ffn_gate.weightI32[7168 19200]
-
blk.61.ffn_up.weightI32[7168 19200]
-
blk.61.ffn_down.weightI32[19200 7168]
-
blk.61.attn_norm.weightF32[7168]
-
blk.61.ffn_norm.weightF32[7168]
-
output_norm.weightF32[7168]
-
output.weightQ6_K[7168 32256]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61