This model is a fine-tuned version of dnhkng/RYS-XLarge, pushing the boundaries of natural language understanding and generation even further.
Tools
35 pulls · Updated 9 days ago
4b96a160a905 · 32GB
-
mradermacher.convert_type: hf
-
mradermacher.quantize_version: 2
-
mradermacher.quantized_at: 2024-08-13T08:15:55+02:00
-
mradermacher.quantized_by: mradermacher
-
mradermacher.quantized_on: db2
-
quantize.imatrix.chunks_count: 318
-
quantize.imatrix.dataset: imatrix-training-full-3
-
quantize.imatrix.entries_count: 602
-
quantize.imatrix.file: calme-2.4-rys-78b-i1-GGUF/imatrix.dat
-
general.architecture: qwen2
-
general.file_type: Q2_K
-
qwen2.attention.head_count: 64
-
qwen2.attention.head_count_kv: 8
-
qwen2.attention.layer_norm_rms_epsilon: 1e-06
-
qwen2.block_count: 86
-
qwen2.context_length: 32768
-
qwen2.embedding_length: 8192
-
qwen2.feed_forward_length: 29568
-
qwen2.rope.freq_base: 1e+06
-
tokenizer.ggml.eos_token_id: 151645
-
tokenizer.ggml.merges: [Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.model: gpt2
-
tokenizer.ggml.padding_token_id: 151643
-
tokenizer.ggml.pre: qwen2
-
tokenizer.ggml.token_type: [1 1 1 1 1 ...]
-
tokenizer.ggml.tokens: [! " # $ % ...]
-
Name Type Shape
-
token_embd.weightQ2_K[8192 151646]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.0.ffn_gate.weightQ2_K[8192 29568]
-
blk.0.ffn_up.weightQ2_K[8192 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightQ2_K[8192 1024]
-
blk.0.attn_output.weightQ3_K[8192 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weightQ2_K[8192 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ4_K[8192 1024]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightQ2_K[8192 1024]
-
blk.1.attn_output.weightQ3_K[8192 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weightQ2_K[8192 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ4_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.1.ffn_gate.weightQ2_K[8192 29568]
-
blk.1.ffn_up.weightQ2_K[8192 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.2.ffn_gate.weightQ2_K[8192 29568]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightQ2_K[8192 1024]
-
blk.2.attn_output.weightQ3_K[8192 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weightQ2_K[8192 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ4_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.2.ffn_up.weightQ2_K[8192 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.3.ffn_gate.weightQ2_K[8192 29568]
-
blk.3.ffn_up.weightQ2_K[8192 29568]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightQ2_K[8192 1024]
-
blk.3.attn_output.weightQ3_K[8192 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weightQ2_K[8192 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ4_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.4.ffn_gate.weightQ2_K[8192 29568]
-
blk.4.ffn_up.weightQ2_K[8192 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightQ2_K[8192 1024]
-
blk.4.attn_output.weightQ3_K[8192 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weightQ2_K[8192 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ4_K[8192 1024]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightQ2_K[8192 1024]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weightQ2_K[8192 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ4_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.5.ffn_gate.weightQ2_K[8192 29568]
-
blk.5.ffn_up.weightQ2_K[8192 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_output.weightQ3_K[8192 8192]
-
blk.6.ffn_gate.weightQ2_K[8192 29568]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightQ2_K[8192 1024]
-
blk.6.attn_output.weightQ3_K[8192 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weightQ2_K[8192 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ4_K[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.6.ffn_up.weightQ2_K[8192 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.7.ffn_gate.weightQ2_K[8192 29568]
-
blk.7.ffn_up.weightQ2_K[8192 29568]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightQ2_K[8192 1024]
-
blk.7.attn_output.weightQ3_K[8192 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weightQ2_K[8192 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ4_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.8.ffn_gate.weightQ2_K[8192 29568]
-
blk.8.ffn_up.weightQ2_K[8192 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightQ2_K[8192 1024]
-
blk.8.attn_output.weightQ3_K[8192 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weightQ2_K[8192 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ4_K[8192 1024]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightQ2_K[8192 1024]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weightQ2_K[8192 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ4_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.9.ffn_gate.weightQ2_K[8192 29568]
-
blk.9.ffn_up.weightQ2_K[8192 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_output.weightQ3_K[8192 8192]
-
blk.10.ffn_gate.weightQ2_K[8192 29568]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightQ2_K[8192 1024]
-
blk.10.attn_output.weightQ3_K[8192 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weightQ2_K[8192 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ4_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.10.ffn_up.weightQ2_K[8192 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.11.ffn_gate.weightQ2_K[8192 29568]
-
blk.11.ffn_up.weightQ2_K[8192 29568]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightQ2_K[8192 1024]
-
blk.11.attn_output.weightQ3_K[8192 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weightQ2_K[8192 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ4_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.12.ffn_gate.weightQ2_K[8192 29568]
-
blk.12.ffn_up.weightQ2_K[8192 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightQ2_K[8192 1024]
-
blk.12.attn_output.weightQ3_K[8192 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weightQ2_K[8192 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ4_K[8192 1024]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightQ2_K[8192 1024]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weightQ2_K[8192 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ4_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.13.ffn_gate.weightQ2_K[8192 29568]
-
blk.13.ffn_up.weightQ2_K[8192 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_output.weightQ3_K[8192 8192]
-
blk.14.ffn_gate.weightQ2_K[8192 29568]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightQ2_K[8192 1024]
-
blk.14.attn_output.weightQ3_K[8192 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weightQ2_K[8192 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ4_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.14.ffn_up.weightQ2_K[8192 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.15.ffn_gate.weightQ2_K[8192 29568]
-
blk.15.ffn_up.weightQ2_K[8192 29568]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightQ2_K[8192 1024]
-
blk.15.attn_output.weightQ3_K[8192 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weightQ2_K[8192 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ4_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.16.ffn_gate.weightQ2_K[8192 29568]
-
blk.16.ffn_up.weightQ2_K[8192 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightQ2_K[8192 1024]
-
blk.16.attn_output.weightQ3_K[8192 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weightQ2_K[8192 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ4_K[8192 1024]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightQ2_K[8192 1024]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weightQ2_K[8192 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ4_K[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.17.ffn_gate.weightQ2_K[8192 29568]
-
blk.17.ffn_up.weightQ2_K[8192 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_output.weightQ3_K[8192 8192]
-
blk.18.ffn_gate.weightQ2_K[8192 29568]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightQ2_K[8192 1024]
-
blk.18.attn_output.weightQ3_K[8192 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weightQ2_K[8192 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ4_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.18.ffn_up.weightQ2_K[8192 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.19.ffn_gate.weightQ2_K[8192 29568]
-
blk.19.ffn_up.weightQ2_K[8192 29568]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightQ2_K[8192 1024]
-
blk.19.attn_output.weightQ3_K[8192 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weightQ2_K[8192 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ4_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.20.ffn_gate.weightQ2_K[8192 29568]
-
blk.20.ffn_up.weightQ2_K[8192 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightQ2_K[8192 1024]
-
blk.20.attn_output.weightQ3_K[8192 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weightQ2_K[8192 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightQ2_K[8192 1024]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weightQ2_K[8192 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ4_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.21.ffn_gate.weightQ2_K[8192 29568]
-
blk.21.ffn_up.weightQ2_K[8192 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_output.weightQ3_K[8192 8192]
-
blk.22.ffn_gate.weightQ2_K[8192 29568]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightQ2_K[8192 1024]
-
blk.22.attn_output.weightQ3_K[8192 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weightQ2_K[8192 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ4_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.22.ffn_up.weightQ2_K[8192 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.23.ffn_gate.weightQ2_K[8192 29568]
-
blk.23.ffn_up.weightQ2_K[8192 29568]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightQ2_K[8192 1024]
-
blk.23.attn_output.weightQ3_K[8192 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weightQ2_K[8192 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ4_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.24.ffn_gate.weightQ2_K[8192 29568]
-
blk.24.ffn_up.weightQ2_K[8192 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightQ2_K[8192 1024]
-
blk.24.attn_output.weightQ3_K[8192 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weightQ2_K[8192 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ4_K[8192 1024]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightQ2_K[8192 1024]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weightQ2_K[8192 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ4_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.25.ffn_gate.weightQ2_K[8192 29568]
-
blk.25.ffn_up.weightQ2_K[8192 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_output.weightQ3_K[8192 8192]
-
blk.26.ffn_gate.weightQ2_K[8192 29568]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightQ2_K[8192 1024]
-
blk.26.attn_output.weightQ3_K[8192 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weightQ2_K[8192 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ4_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.26.ffn_up.weightQ2_K[8192 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.27.ffn_gate.weightQ2_K[8192 29568]
-
blk.27.ffn_up.weightQ2_K[8192 29568]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightQ2_K[8192 1024]
-
blk.27.attn_output.weightQ3_K[8192 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weightQ2_K[8192 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ4_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.28.ffn_gate.weightQ2_K[8192 29568]
-
blk.28.ffn_up.weightQ2_K[8192 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightQ2_K[8192 1024]
-
blk.28.attn_output.weightQ3_K[8192 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weightQ2_K[8192 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightQ2_K[8192 1024]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weightQ2_K[8192 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ4_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.29.ffn_gate.weightQ2_K[8192 29568]
-
blk.29.ffn_up.weightQ2_K[8192 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_output.weightQ3_K[8192 8192]
-
blk.30.ffn_gate.weightQ2_K[8192 29568]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightQ2_K[8192 1024]
-
blk.30.attn_output.weightQ3_K[8192 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weightQ2_K[8192 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ4_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.30.ffn_up.weightQ2_K[8192 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.31.ffn_gate.weightQ2_K[8192 29568]
-
blk.31.ffn_up.weightQ2_K[8192 29568]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightQ2_K[8192 1024]
-
blk.31.attn_output.weightQ3_K[8192 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weightQ2_K[8192 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ4_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.32.ffn_gate.weightQ2_K[8192 29568]
-
blk.32.ffn_up.weightQ2_K[8192 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightQ2_K[8192 1024]
-
blk.32.attn_output.weightQ3_K[8192 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weightQ2_K[8192 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ4_K[8192 1024]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightQ2_K[8192 1024]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weightQ2_K[8192 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ4_K[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.33.ffn_gate.weightQ2_K[8192 29568]
-
blk.33.ffn_up.weightQ2_K[8192 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_output.weightQ3_K[8192 8192]
-
blk.34.ffn_gate.weightQ2_K[8192 29568]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightQ2_K[8192 1024]
-
blk.34.attn_output.weightQ3_K[8192 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weightQ2_K[8192 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ4_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.34.ffn_up.weightQ2_K[8192 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.35.ffn_gate.weightQ2_K[8192 29568]
-
blk.35.ffn_up.weightQ2_K[8192 29568]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightQ2_K[8192 1024]
-
blk.35.attn_output.weightQ3_K[8192 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weightQ2_K[8192 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ4_K[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.36.ffn_gate.weightQ2_K[8192 29568]
-
blk.36.ffn_up.weightQ2_K[8192 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightQ2_K[8192 1024]
-
blk.36.attn_output.weightQ3_K[8192 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weightQ2_K[8192 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ4_K[8192 1024]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightQ2_K[8192 1024]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weightQ2_K[8192 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ4_K[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.37.ffn_gate.weightQ2_K[8192 29568]
-
blk.37.ffn_up.weightQ2_K[8192 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_output.weightQ3_K[8192 8192]
-
blk.38.ffn_gate.weightQ2_K[8192 29568]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightQ2_K[8192 1024]
-
blk.38.attn_output.weightQ3_K[8192 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weightQ2_K[8192 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ4_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.38.ffn_up.weightQ2_K[8192 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.39.ffn_gate.weightQ2_K[8192 29568]
-
blk.39.ffn_up.weightQ2_K[8192 29568]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightQ2_K[8192 1024]
-
blk.39.attn_output.weightQ3_K[8192 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weightQ2_K[8192 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ4_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.40.ffn_gate.weightQ2_K[8192 29568]
-
blk.40.ffn_up.weightQ2_K[8192 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightQ2_K[8192 1024]
-
blk.40.attn_output.weightQ3_K[8192 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weightQ2_K[8192 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ4_K[8192 1024]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightQ2_K[8192 1024]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weightQ2_K[8192 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ4_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.41.ffn_gate.weightQ2_K[8192 29568]
-
blk.41.ffn_up.weightQ2_K[8192 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_output.weightQ3_K[8192 8192]
-
blk.42.ffn_gate.weightQ2_K[8192 29568]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightQ2_K[8192 1024]
-
blk.42.attn_output.weightQ3_K[8192 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weightQ2_K[8192 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ4_K[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.42.ffn_up.weightQ2_K[8192 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.43.ffn_gate.weightQ2_K[8192 29568]
-
blk.43.ffn_up.weightQ2_K[8192 29568]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightQ2_K[8192 1024]
-
blk.43.attn_output.weightQ3_K[8192 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weightQ2_K[8192 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ4_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.44.ffn_gate.weightQ2_K[8192 29568]
-
blk.44.ffn_up.weightQ2_K[8192 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightQ2_K[8192 1024]
-
blk.44.attn_output.weightQ3_K[8192 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weightQ2_K[8192 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ4_K[8192 1024]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightQ2_K[8192 1024]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weightQ2_K[8192 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ4_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.45.ffn_gate.weightQ2_K[8192 29568]
-
blk.45.ffn_up.weightQ2_K[8192 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_output.weightQ3_K[8192 8192]
-
blk.46.ffn_gate.weightQ2_K[8192 29568]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightQ2_K[8192 1024]
-
blk.46.attn_output.weightQ3_K[8192 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weightQ2_K[8192 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ4_K[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.46.ffn_up.weightQ2_K[8192 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.47.ffn_gate.weightQ2_K[8192 29568]
-
blk.47.ffn_up.weightQ2_K[8192 29568]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightQ2_K[8192 1024]
-
blk.47.attn_output.weightQ3_K[8192 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weightQ2_K[8192 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ4_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.48.ffn_gate.weightQ2_K[8192 29568]
-
blk.48.ffn_up.weightQ2_K[8192 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightQ2_K[8192 1024]
-
blk.48.attn_output.weightQ3_K[8192 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weightQ2_K[8192 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ4_K[8192 1024]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightQ2_K[8192 1024]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weightQ2_K[8192 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ4_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.49.ffn_gate.weightQ2_K[8192 29568]
-
blk.49.ffn_up.weightQ2_K[8192 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_output.weightQ3_K[8192 8192]
-
blk.50.ffn_gate.weightQ2_K[8192 29568]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightQ2_K[8192 1024]
-
blk.50.attn_output.weightQ3_K[8192 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weightQ2_K[8192 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ4_K[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.50.ffn_up.weightQ2_K[8192 29568]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.51.ffn_gate.weightQ2_K[8192 29568]
-
blk.51.ffn_up.weightQ2_K[8192 29568]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightQ2_K[8192 1024]
-
blk.51.attn_output.weightQ3_K[8192 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weightQ2_K[8192 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ4_K[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.52.ffn_gate.weightQ2_K[8192 29568]
-
blk.52.ffn_up.weightQ2_K[8192 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightQ2_K[8192 1024]
-
blk.52.attn_output.weightQ3_K[8192 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weightQ2_K[8192 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ4_K[8192 1024]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightQ2_K[8192 1024]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weightQ2_K[8192 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ4_K[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.53.ffn_gate.weightQ2_K[8192 29568]
-
blk.53.ffn_up.weightQ2_K[8192 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_output.weightQ3_K[8192 8192]
-
blk.54.ffn_gate.weightQ2_K[8192 29568]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightQ2_K[8192 1024]
-
blk.54.attn_output.weightQ3_K[8192 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weightQ2_K[8192 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ4_K[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.54.ffn_up.weightQ2_K[8192 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.55.ffn_gate.weightQ2_K[8192 29568]
-
blk.55.ffn_up.weightQ2_K[8192 29568]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightQ2_K[8192 1024]
-
blk.55.attn_output.weightQ3_K[8192 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weightQ2_K[8192 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ4_K[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.56.ffn_gate.weightQ2_K[8192 29568]
-
blk.56.ffn_up.weightQ2_K[8192 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightQ2_K[8192 1024]
-
blk.56.attn_output.weightQ3_K[8192 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weightQ2_K[8192 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ4_K[8192 1024]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightQ2_K[8192 1024]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weightQ2_K[8192 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ4_K[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.57.ffn_gate.weightQ2_K[8192 29568]
-
blk.57.ffn_up.weightQ2_K[8192 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_output.weightQ3_K[8192 8192]
-
blk.58.ffn_gate.weightQ2_K[8192 29568]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightQ2_K[8192 1024]
-
blk.58.attn_output.weightQ3_K[8192 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weightQ2_K[8192 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ4_K[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.58.ffn_up.weightQ2_K[8192 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.59.ffn_gate.weightQ2_K[8192 29568]
-
blk.59.ffn_up.weightQ2_K[8192 29568]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightQ2_K[8192 1024]
-
blk.59.attn_output.weightQ3_K[8192 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weightQ2_K[8192 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ4_K[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.60.ffn_gate.weightQ2_K[8192 29568]
-
blk.60.ffn_up.weightQ2_K[8192 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightQ2_K[8192 1024]
-
blk.60.attn_output.weightQ3_K[8192 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weightQ2_K[8192 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ4_K[8192 1024]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightQ2_K[8192 1024]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weightQ2_K[8192 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ4_K[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.61.ffn_gate.weightQ2_K[8192 29568]
-
blk.61.ffn_up.weightQ2_K[8192 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.attn_output.weightQ3_K[8192 8192]
-
blk.62.ffn_gate.weightQ2_K[8192 29568]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightQ2_K[8192 1024]
-
blk.62.attn_output.weightQ3_K[8192 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weightQ2_K[8192 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ4_K[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.62.ffn_up.weightQ2_K[8192 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.63.ffn_gate.weightQ2_K[8192 29568]
-
blk.63.ffn_up.weightQ2_K[8192 29568]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightQ2_K[8192 1024]
-
blk.63.attn_output.weightQ3_K[8192 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weightQ2_K[8192 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ4_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.64.ffn_gate.weightQ2_K[8192 29568]
-
blk.64.ffn_up.weightQ2_K[8192 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weightQ2_K[8192 1024]
-
blk.64.attn_output.weightQ3_K[8192 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weightQ2_K[8192 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ4_K[8192 1024]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weightQ2_K[8192 1024]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weightQ2_K[8192 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ4_K[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.65.ffn_gate.weightQ2_K[8192 29568]
-
blk.65.ffn_up.weightQ2_K[8192 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_output.weightQ3_K[8192 8192]
-
blk.66.ffn_gate.weightQ2_K[8192 29568]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weightQ2_K[8192 1024]
-
blk.66.attn_output.weightQ3_K[8192 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weightQ2_K[8192 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ4_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.66.ffn_up.weightQ2_K[8192 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.67.ffn_gate.weightQ2_K[8192 29568]
-
blk.67.ffn_up.weightQ2_K[8192 29568]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weightQ2_K[8192 1024]
-
blk.67.attn_output.weightQ3_K[8192 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weightQ2_K[8192 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ4_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.68.ffn_gate.weightQ2_K[8192 29568]
-
blk.68.ffn_up.weightQ2_K[8192 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weightQ2_K[8192 1024]
-
blk.68.attn_output.weightQ3_K[8192 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weightQ2_K[8192 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ4_K[8192 1024]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weightQ2_K[8192 1024]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weightQ2_K[8192 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ4_K[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.69.ffn_gate.weightQ2_K[8192 29568]
-
blk.69.ffn_up.weightQ2_K[8192 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_output.weightQ3_K[8192 8192]
-
blk.70.ffn_gate.weightQ2_K[8192 29568]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weightQ2_K[8192 1024]
-
blk.70.attn_output.weightQ3_K[8192 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weightQ2_K[8192 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ4_K[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.70.ffn_up.weightQ2_K[8192 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.71.ffn_gate.weightQ2_K[8192 29568]
-
blk.71.ffn_up.weightQ2_K[8192 29568]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weightQ2_K[8192 1024]
-
blk.71.attn_output.weightQ3_K[8192 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weightQ2_K[8192 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ4_K[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.72.ffn_gate.weightQ2_K[8192 29568]
-
blk.72.ffn_up.weightQ2_K[8192 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weightQ2_K[8192 1024]
-
blk.72.attn_output.weightQ3_K[8192 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weightQ2_K[8192 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ4_K[8192 1024]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weightQ2_K[8192 1024]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weightQ2_K[8192 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ4_K[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.73.ffn_gate.weightQ2_K[8192 29568]
-
blk.73.ffn_up.weightQ2_K[8192 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_output.weightQ3_K[8192 8192]
-
blk.74.ffn_gate.weightQ2_K[8192 29568]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weightQ2_K[8192 1024]
-
blk.74.attn_output.weightQ3_K[8192 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weightQ2_K[8192 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ4_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.74.ffn_up.weightQ2_K[8192 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.75.ffn_gate.weightQ2_K[8192 29568]
-
blk.75.ffn_up.weightQ2_K[8192 29568]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weightQ2_K[8192 1024]
-
blk.75.attn_output.weightQ3_K[8192 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weightQ2_K[8192 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ4_K[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.76.ffn_gate.weightQ2_K[8192 29568]
-
blk.76.ffn_up.weightQ2_K[8192 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weightQ2_K[8192 1024]
-
blk.76.attn_output.weightQ3_K[8192 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weightQ2_K[8192 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weightQ2_K[8192 1024]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weightQ2_K[8192 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ4_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.77.ffn_gate.weightQ2_K[8192 29568]
-
blk.77.ffn_up.weightQ2_K[8192 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_output.weightQ3_K[8192 8192]
-
blk.78.ffn_gate.weightQ2_K[8192 29568]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weightQ2_K[8192 1024]
-
blk.78.attn_output.weightQ3_K[8192 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weightQ2_K[8192 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ4_K[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.78.ffn_up.weightQ2_K[8192 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.79.ffn_gate.weightQ2_K[8192 29568]
-
blk.79.ffn_up.weightQ2_K[8192 29568]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weightQ2_K[8192 1024]
-
blk.79.attn_output.weightQ3_K[8192 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weightQ2_K[8192 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ4_K[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.80.attn_norm.weightF32[8192]
-
blk.80.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.80.ffn_gate.weightQ2_K[8192 29568]
-
blk.80.ffn_up.weightQ2_K[8192 29568]
-
blk.80.ffn_norm.weightF32[8192]
-
blk.80.attn_k.biasF32[1024]
-
blk.80.attn_k.weightQ2_K[8192 1024]
-
blk.80.attn_output.weightQ3_K[8192 8192]
-
blk.80.attn_q.biasF32[8192]
-
blk.80.attn_q.weightQ2_K[8192 8192]
-
blk.80.attn_v.biasF32[1024]
-
blk.80.attn_v.weightQ4_K[8192 1024]
-
blk.81.attn_k.biasF32[1024]
-
blk.81.attn_k.weightQ2_K[8192 1024]
-
blk.81.attn_q.biasF32[8192]
-
blk.81.attn_q.weightQ2_K[8192 8192]
-
blk.81.attn_v.biasF32[1024]
-
blk.81.attn_v.weightQ4_K[8192 1024]
-
blk.81.attn_norm.weightF32[8192]
-
blk.81.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.81.ffn_gate.weightQ2_K[8192 29568]
-
blk.81.ffn_up.weightQ2_K[8192 29568]
-
blk.81.ffn_norm.weightF32[8192]
-
blk.81.attn_output.weightQ3_K[8192 8192]
-
blk.82.ffn_gate.weightQ2_K[8192 29568]
-
blk.82.attn_k.biasF32[1024]
-
blk.82.attn_k.weightQ2_K[8192 1024]
-
blk.82.attn_output.weightQ3_K[8192 8192]
-
blk.82.attn_q.biasF32[8192]
-
blk.82.attn_q.weightQ2_K[8192 8192]
-
blk.82.attn_v.biasF32[1024]
-
blk.82.attn_v.weightQ4_K[8192 1024]
-
blk.82.attn_norm.weightF32[8192]
-
blk.82.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.82.ffn_up.weightQ2_K[8192 29568]
-
blk.82.ffn_norm.weightF32[8192]
-
blk.83.ffn_gate.weightQ2_K[8192 29568]
-
blk.83.ffn_up.weightQ2_K[8192 29568]
-
blk.83.attn_k.biasF32[1024]
-
blk.83.attn_k.weightQ2_K[8192 1024]
-
blk.83.attn_output.weightQ3_K[8192 8192]
-
blk.83.attn_q.biasF32[8192]
-
blk.83.attn_q.weightQ2_K[8192 8192]
-
blk.83.attn_v.biasF32[1024]
-
blk.83.attn_v.weightQ4_K[8192 1024]
-
blk.83.attn_norm.weightF32[8192]
-
blk.83.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.83.ffn_norm.weightF32[8192]
-
blk.84.attn_norm.weightF32[8192]
-
blk.84.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.84.ffn_gate.weightQ2_K[8192 29568]
-
blk.84.ffn_up.weightQ2_K[8192 29568]
-
blk.84.ffn_norm.weightF32[8192]
-
blk.84.attn_k.biasF32[1024]
-
blk.84.attn_k.weightQ2_K[8192 1024]
-
blk.84.attn_output.weightQ3_K[8192 8192]
-
blk.84.attn_q.biasF32[8192]
-
blk.84.attn_q.weightQ2_K[8192 8192]
-
blk.84.attn_v.biasF32[1024]
-
blk.84.attn_v.weightQ4_K[8192 1024]
-
blk.85.attn_k.biasF32[1024]
-
blk.85.attn_k.weightQ2_K[8192 1024]
-
blk.85.attn_q.biasF32[8192]
-
blk.85.attn_q.weightQ2_K[8192 8192]
-
blk.85.attn_v.biasF32[1024]
-
blk.85.attn_v.weightQ4_K[8192 1024]
-
blk.85.attn_norm.weightF32[8192]
-
blk.85.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.85.ffn_gate.weightQ2_K[8192 29568]
-
blk.85.ffn_up.weightQ2_K[8192 29568]
-
blk.85.ffn_norm.weightF32[8192]
-
blk.85.attn_output.weightQ3_K[8192 8192]
-
output_norm.weightF32[8192]
-
output.weightQ6_K[8192 151646]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79
blk.80
blk.81
blk.82
blk.83
blk.84
blk.85