latest
35GB
This is a new kind of model optimization. This model is based on MaziyarPanahi/calme-2.1-qwen2-72b, which was tuned from Qwen2-72B.
18 Pulls Updated 2 weeks ago
49aabbef3a7d · 35GB
-
quantize.imatrix.chunks_count68
-
quantize.imatrix.datasetgroup_40.txt
-
quantize.imatrix.entries_count602
-
quantize.imatrix.file./RYS-XLarge-GGUF_imatrix.dat
-
general.architectureqwen2
-
general.file_typeIQ3_XS
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count86
-
qwen2.context_length32768
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.bos_token_id151643
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[8192 151646]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.0.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.0.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightI32[8192 1024]
-
blk.0.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weightI32[8192 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.1.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.1.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightI32[8192 1024]
-
blk.1.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weightI32[8192 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.2.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.2.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightI32[8192 1024]
-
blk.2.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weightI32[8192 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.3.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.3.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightI32[8192 1024]
-
blk.3.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weightI32[8192 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_K[8192 1024]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.4.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.4.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightI32[8192 1024]
-
blk.4.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weightI32[8192 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.5.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.5.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightI32[8192 1024]
-
blk.5.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weightI32[8192 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_K[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.6.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.6.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightI32[8192 1024]
-
blk.6.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weightI32[8192 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.7.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.7.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightI32[8192 1024]
-
blk.7.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weightI32[8192 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_K[8192 1024]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.8.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.8.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightI32[8192 1024]
-
blk.8.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weightI32[8192 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.9.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.9.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightI32[8192 1024]
-
blk.9.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weightI32[8192 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.10.ffn_gate.weightI32[8192 29568]
-
blk.10.ffn_up.weightI32[8192 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightI32[8192 1024]
-
blk.10.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weightI32[8192 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.11.ffn_gate.weightI32[8192 29568]
-
blk.11.ffn_up.weightI32[8192 29568]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightI32[8192 1024]
-
blk.11.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weightI32[8192 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_K[8192 1024]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.12.ffn_gate.weightI32[8192 29568]
-
blk.12.ffn_up.weightI32[8192 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightI32[8192 1024]
-
blk.12.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weightI32[8192 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.13.ffn_gate.weightI32[8192 29568]
-
blk.13.ffn_up.weightI32[8192 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightI32[8192 1024]
-
blk.13.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weightI32[8192 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.14.ffn_gate.weightI32[8192 29568]
-
blk.14.ffn_up.weightI32[8192 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightI32[8192 1024]
-
blk.14.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weightI32[8192 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.15.ffn_gate.weightI32[8192 29568]
-
blk.15.ffn_up.weightI32[8192 29568]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightI32[8192 1024]
-
blk.15.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weightI32[8192 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_K[8192 1024]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.16.ffn_gate.weightI32[8192 29568]
-
blk.16.ffn_up.weightI32[8192 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightI32[8192 1024]
-
blk.16.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weightI32[8192 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_K[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.17.ffn_gate.weightI32[8192 29568]
-
blk.17.ffn_up.weightI32[8192 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightI32[8192 1024]
-
blk.17.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weightI32[8192 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.18.ffn_gate.weightI32[8192 29568]
-
blk.18.ffn_up.weightI32[8192 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightI32[8192 1024]
-
blk.18.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weightI32[8192 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.19.ffn_gate.weightI32[8192 29568]
-
blk.19.ffn_up.weightI32[8192 29568]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightI32[8192 1024]
-
blk.19.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weightI32[8192 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_K[8192 1024]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.20.ffn_gate.weightI32[8192 29568]
-
blk.20.ffn_up.weightI32[8192 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightI32[8192 1024]
-
blk.20.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weightI32[8192 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.21.ffn_gate.weightI32[8192 29568]
-
blk.21.ffn_up.weightI32[8192 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightI32[8192 1024]
-
blk.21.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weightI32[8192 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.22.ffn_gate.weightI32[8192 29568]
-
blk.22.ffn_up.weightI32[8192 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightI32[8192 1024]
-
blk.22.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weightI32[8192 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.23.ffn_gate.weightI32[8192 29568]
-
blk.23.ffn_up.weightI32[8192 29568]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightI32[8192 1024]
-
blk.23.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weightI32[8192 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_K[8192 1024]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.24.ffn_gate.weightI32[8192 29568]
-
blk.24.ffn_up.weightI32[8192 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightI32[8192 1024]
-
blk.24.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weightI32[8192 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.25.ffn_gate.weightI32[8192 29568]
-
blk.25.ffn_up.weightI32[8192 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightI32[8192 1024]
-
blk.25.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weightI32[8192 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.26.ffn_gate.weightI32[8192 29568]
-
blk.26.ffn_up.weightI32[8192 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightI32[8192 1024]
-
blk.26.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weightI32[8192 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.27.ffn_gate.weightI32[8192 29568]
-
blk.27.ffn_up.weightI32[8192 29568]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightI32[8192 1024]
-
blk.27.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weightI32[8192 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_K[8192 1024]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.28.ffn_gate.weightI32[8192 29568]
-
blk.28.ffn_up.weightI32[8192 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightI32[8192 1024]
-
blk.28.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weightI32[8192 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.29.ffn_gate.weightI32[8192 29568]
-
blk.29.ffn_up.weightI32[8192 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightI32[8192 1024]
-
blk.29.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weightI32[8192 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.30.ffn_gate.weightI32[8192 29568]
-
blk.30.ffn_up.weightI32[8192 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightI32[8192 1024]
-
blk.30.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weightI32[8192 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.31.ffn_gate.weightI32[8192 29568]
-
blk.31.ffn_up.weightI32[8192 29568]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightI32[8192 1024]
-
blk.31.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weightI32[8192 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_K[8192 1024]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.32.ffn_gate.weightI32[8192 29568]
-
blk.32.ffn_up.weightI32[8192 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightI32[8192 1024]
-
blk.32.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weightI32[8192 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_K[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.33.ffn_gate.weightI32[8192 29568]
-
blk.33.ffn_up.weightI32[8192 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightI32[8192 1024]
-
blk.33.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weightI32[8192 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.34.ffn_gate.weightI32[8192 29568]
-
blk.34.ffn_up.weightI32[8192 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightI32[8192 1024]
-
blk.34.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weightI32[8192 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_K[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.35.ffn_gate.weightI32[8192 29568]
-
blk.35.ffn_up.weightI32[8192 29568]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightI32[8192 1024]
-
blk.35.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weightI32[8192 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_K[8192 1024]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.36.ffn_gate.weightI32[8192 29568]
-
blk.36.ffn_up.weightI32[8192 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightI32[8192 1024]
-
blk.36.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weightI32[8192 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_K[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.37.ffn_gate.weightI32[8192 29568]
-
blk.37.ffn_up.weightI32[8192 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightI32[8192 1024]
-
blk.37.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weightI32[8192 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.38.ffn_gate.weightI32[8192 29568]
-
blk.38.ffn_up.weightI32[8192 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightI32[8192 1024]
-
blk.38.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weightI32[8192 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.39.ffn_gate.weightI32[8192 29568]
-
blk.39.ffn_up.weightI32[8192 29568]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightI32[8192 1024]
-
blk.39.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weightI32[8192 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_K[8192 1024]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.40.ffn_gate.weightI32[8192 29568]
-
blk.40.ffn_up.weightI32[8192 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightI32[8192 1024]
-
blk.40.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weightI32[8192 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.41.ffn_gate.weightI32[8192 29568]
-
blk.41.ffn_up.weightI32[8192 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightI32[8192 1024]
-
blk.41.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weightI32[8192 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_K[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.42.ffn_gate.weightI32[8192 29568]
-
blk.42.ffn_up.weightI32[8192 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightI32[8192 1024]
-
blk.42.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weightI32[8192 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.43.ffn_gate.weightI32[8192 29568]
-
blk.43.ffn_up.weightI32[8192 29568]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightI32[8192 1024]
-
blk.43.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weightI32[8192 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_K[8192 1024]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.44.ffn_gate.weightI32[8192 29568]
-
blk.44.ffn_up.weightI32[8192 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightI32[8192 1024]
-
blk.44.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weightI32[8192 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.45.ffn_gate.weightI32[8192 29568]
-
blk.45.ffn_up.weightI32[8192 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightI32[8192 1024]
-
blk.45.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weightI32[8192 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_K[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.46.ffn_gate.weightI32[8192 29568]
-
blk.46.ffn_up.weightI32[8192 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightI32[8192 1024]
-
blk.46.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weightI32[8192 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.47.ffn_gate.weightI32[8192 29568]
-
blk.47.ffn_up.weightI32[8192 29568]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightI32[8192 1024]
-
blk.47.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weightI32[8192 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_K[8192 1024]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.48.ffn_gate.weightI32[8192 29568]
-
blk.48.ffn_up.weightI32[8192 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightI32[8192 1024]
-
blk.48.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weightI32[8192 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ4_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.49.ffn_gate.weightI32[8192 29568]
-
blk.49.ffn_up.weightI32[8192 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightI32[8192 1024]
-
blk.49.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weightI32[8192 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ4_K[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.50.ffn_gate.weightI32[8192 29568]
-
blk.50.ffn_up.weightI32[8192 29568]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightI32[8192 1024]
-
blk.50.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weightI32[8192 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ4_K[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.51.ffn_gate.weightI32[8192 29568]
-
blk.51.ffn_up.weightI32[8192 29568]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightI32[8192 1024]
-
blk.51.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weightI32[8192 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ4_K[8192 1024]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.52.ffn_gate.weightI32[8192 29568]
-
blk.52.ffn_up.weightI32[8192 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightI32[8192 1024]
-
blk.52.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weightI32[8192 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ4_K[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.53.ffn_gate.weightI32[8192 29568]
-
blk.53.ffn_up.weightI32[8192 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightI32[8192 1024]
-
blk.53.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weightI32[8192 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ4_K[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.54.ffn_gate.weightI32[8192 29568]
-
blk.54.ffn_up.weightI32[8192 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightI32[8192 1024]
-
blk.54.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weightI32[8192 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ4_K[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.55.ffn_gate.weightI32[8192 29568]
-
blk.55.ffn_up.weightI32[8192 29568]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightI32[8192 1024]
-
blk.55.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weightI32[8192 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ4_K[8192 1024]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.56.ffn_gate.weightI32[8192 29568]
-
blk.56.ffn_up.weightI32[8192 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightI32[8192 1024]
-
blk.56.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weightI32[8192 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ4_K[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.57.ffn_gate.weightI32[8192 29568]
-
blk.57.ffn_up.weightI32[8192 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightI32[8192 1024]
-
blk.57.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weightI32[8192 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ4_K[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.58.ffn_gate.weightI32[8192 29568]
-
blk.58.ffn_up.weightI32[8192 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightI32[8192 1024]
-
blk.58.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weightI32[8192 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ4_K[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.59.ffn_gate.weightI32[8192 29568]
-
blk.59.ffn_up.weightI32[8192 29568]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightI32[8192 1024]
-
blk.59.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weightI32[8192 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ4_K[8192 1024]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.60.ffn_gate.weightI32[8192 29568]
-
blk.60.ffn_up.weightI32[8192 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightI32[8192 1024]
-
blk.60.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weightI32[8192 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ4_K[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.61.ffn_gate.weightI32[8192 29568]
-
blk.61.ffn_up.weightI32[8192 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightI32[8192 1024]
-
blk.61.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weightI32[8192 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ4_K[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.62.ffn_gate.weightI32[8192 29568]
-
blk.62.ffn_up.weightI32[8192 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightI32[8192 1024]
-
blk.62.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weightI32[8192 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ4_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.63.ffn_gate.weightI32[8192 29568]
-
blk.63.ffn_up.weightI32[8192 29568]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightI32[8192 1024]
-
blk.63.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weightI32[8192 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ4_K[8192 1024]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.64.ffn_gate.weightI32[8192 29568]
-
blk.64.ffn_up.weightI32[8192 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weightI32[8192 1024]
-
blk.64.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weightI32[8192 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ4_K[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.65.ffn_gate.weightI32[8192 29568]
-
blk.65.ffn_up.weightI32[8192 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weightI32[8192 1024]
-
blk.65.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weightI32[8192 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ4_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.66.ffn_gate.weightI32[8192 29568]
-
blk.66.ffn_up.weightI32[8192 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weightI32[8192 1024]
-
blk.66.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weightI32[8192 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ4_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.67.ffn_gate.weightI32[8192 29568]
-
blk.67.ffn_up.weightI32[8192 29568]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weightI32[8192 1024]
-
blk.67.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weightI32[8192 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ4_K[8192 1024]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.68.ffn_gate.weightI32[8192 29568]
-
blk.68.ffn_up.weightI32[8192 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weightI32[8192 1024]
-
blk.68.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weightI32[8192 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ4_K[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.69.ffn_gate.weightI32[8192 29568]
-
blk.69.ffn_up.weightI32[8192 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weightI32[8192 1024]
-
blk.69.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weightI32[8192 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ4_K[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.70.ffn_gate.weightI32[8192 29568]
-
blk.70.ffn_up.weightI32[8192 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weightI32[8192 1024]
-
blk.70.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weightI32[8192 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ4_K[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.71.ffn_gate.weightI32[8192 29568]
-
blk.71.ffn_up.weightI32[8192 29568]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weightI32[8192 1024]
-
blk.71.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weightI32[8192 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ4_K[8192 1024]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.72.ffn_gate.weightI32[8192 29568]
-
blk.72.ffn_up.weightI32[8192 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weightI32[8192 1024]
-
blk.72.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weightI32[8192 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ4_K[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.73.ffn_gate.weightI32[8192 29568]
-
blk.73.ffn_up.weightI32[8192 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weightI32[8192 1024]
-
blk.73.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weightI32[8192 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ4_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.74.ffn_gate.weightI32[8192 29568]
-
blk.74.ffn_up.weightI32[8192 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weightI32[8192 1024]
-
blk.74.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weightI32[8192 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ4_K[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.75.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.75.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weightI32[8192 1024]
-
blk.75.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weightI32[8192 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ4_K[8192 1024]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.76.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.76.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weightI32[8192 1024]
-
blk.76.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weightI32[8192 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.77.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.77.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weightI32[8192 1024]
-
blk.77.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weightI32[8192 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ4_K[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.78.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.78.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weightI32[8192 1024]
-
blk.78.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weightI32[8192 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ4_K[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.79.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.79.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weightI32[8192 1024]
-
blk.79.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weightI32[8192 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ4_K[8192 1024]
-
blk.80.attn_norm.weightF32[8192]
-
blk.80.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.80.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.80.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.80.ffn_norm.weightF32[8192]
-
blk.80.attn_k.biasF32[1024]
-
blk.80.attn_k.weightI32[8192 1024]
-
blk.80.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.80.attn_q.biasF32[8192]
-
blk.80.attn_q.weightI32[8192 8192]
-
blk.80.attn_v.biasF32[1024]
-
blk.80.attn_v.weightQ4_K[8192 1024]
-
blk.81.attn_norm.weightF32[8192]
-
blk.81.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.81.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.81.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.81.ffn_norm.weightF32[8192]
-
blk.81.attn_k.biasF32[1024]
-
blk.81.attn_k.weightI32[8192 1024]
-
blk.81.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.81.attn_q.biasF32[8192]
-
blk.81.attn_q.weightI32[8192 8192]
-
blk.81.attn_v.biasF32[1024]
-
blk.81.attn_v.weightQ4_K[8192 1024]
-
blk.82.attn_norm.weightF32[8192]
-
blk.82.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.82.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.82.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.82.ffn_norm.weightF32[8192]
-
blk.82.attn_k.biasF32[1024]
-
blk.82.attn_k.weightI32[8192 1024]
-
blk.82.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.82.attn_q.biasF32[8192]
-
blk.82.attn_q.weightI32[8192 8192]
-
blk.82.attn_v.biasF32[1024]
-
blk.82.attn_v.weightQ4_K[8192 1024]
-
blk.83.attn_norm.weightF32[8192]
-
blk.83.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.83.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.83.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.83.ffn_norm.weightF32[8192]
-
blk.83.attn_k.biasF32[1024]
-
blk.83.attn_k.weightI32[8192 1024]
-
blk.83.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.83.attn_q.biasF32[8192]
-
blk.83.attn_q.weightI32[8192 8192]
-
blk.83.attn_v.biasF32[1024]
-
blk.83.attn_v.weightQ4_K[8192 1024]
-
blk.84.attn_norm.weightF32[8192]
-
blk.84.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.84.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.84.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.84.ffn_norm.weightF32[8192]
-
blk.84.attn_k.biasF32[1024]
-
blk.84.attn_k.weightI32[8192 1024]
-
blk.84.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.84.attn_q.biasF32[8192]
-
blk.84.attn_q.weightI32[8192 8192]
-
blk.84.attn_v.biasF32[1024]
-
blk.84.attn_v.weightQ4_K[8192 1024]
-
blk.85.attn_norm.weightF32[8192]
-
blk.85.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.85.ffn_gate.weight(!unknown_type 21!)[8192 29568]
-
blk.85.ffn_up.weight(!unknown_type 21!)[8192 29568]
-
blk.85.ffn_norm.weightF32[8192]
-
blk.85.attn_k.biasF32[1024]
-
blk.85.attn_k.weightI32[8192 1024]
-
blk.85.attn_output.weight(!unknown_type 21!)[8192 8192]
-
blk.85.attn_q.biasF32[8192]
-
blk.85.attn_q.weightI32[8192 8192]
-
blk.85.attn_v.biasF32[1024]
-
blk.85.attn_v.weightQ4_K[8192 1024]
-
output.weightQ6_K[8192 151646]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79
blk.80
blk.81
blk.82
blk.83
blk.84
blk.85