This model is a fine-tuned version of the dnhkng/RYS-XLarge, pushing the boundaries of natural language understanding and generation even further.
Tools
36 Pulls Updated 9 days ago
8bc2b1fbc92f · 37GB
-
mradermacher.convert_typehf
-
mradermacher.quantize_version2
-
mradermacher.quantized_at2024-08-13T11:33:45+02:00
-
mradermacher.quantized_bymradermacher
-
mradermacher.quantized_ondb2
-
quantize.imatrix.chunks_count318
-
quantize.imatrix.datasetimatrix-training-full-3
-
quantize.imatrix.entries_count602
-
quantize.imatrix.filecalme-2.4-rys-78b-i1-GGUF/imatrix.dat
-
general.architectureqwen2
-
general.file_typeQ3_K_S
-
qwen2.attention.head_count64
-
qwen2.attention.head_count_kv8
-
qwen2.attention.layer_norm_rms_epsilon1e-06
-
qwen2.block_count86
-
qwen2.context_length32768
-
qwen2.embedding_length8192
-
qwen2.feed_forward_length29568
-
qwen2.rope.freq_base1e+06
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id151643
-
tokenizer.ggml.preqwen2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
NameTypeShape
-
token_embd.weightQ3_K[8192 151646]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.0.ffn_gate.weightQ3_K[8192 29568]
-
blk.0.ffn_up.weightQ3_K[8192 29568]
-
blk.0.ffn_norm.weightF32[8192]
-
blk.0.attn_k.biasF32[1024]
-
blk.0.attn_k.weightQ3_K[8192 1024]
-
blk.0.attn_output.weightQ3_K[8192 8192]
-
blk.0.attn_q.biasF32[8192]
-
blk.0.attn_q.weightQ3_K[8192 8192]
-
blk.0.attn_v.biasF32[1024]
-
blk.0.attn_v.weightQ3_K[8192 1024]
-
blk.1.attn_k.biasF32[1024]
-
blk.1.attn_k.weightQ3_K[8192 1024]
-
blk.1.attn_output.weightQ3_K[8192 8192]
-
blk.1.attn_q.biasF32[8192]
-
blk.1.attn_q.weightQ3_K[8192 8192]
-
blk.1.attn_v.biasF32[1024]
-
blk.1.attn_v.weightQ3_K[8192 1024]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.1.ffn_gate.weightQ3_K[8192 29568]
-
blk.1.ffn_up.weightQ3_K[8192 29568]
-
blk.1.ffn_norm.weightF32[8192]
-
blk.2.ffn_gate.weightQ3_K[8192 29568]
-
blk.2.attn_k.biasF32[1024]
-
blk.2.attn_k.weightQ3_K[8192 1024]
-
blk.2.attn_output.weightQ3_K[8192 8192]
-
blk.2.attn_q.biasF32[8192]
-
blk.2.attn_q.weightQ3_K[8192 8192]
-
blk.2.attn_v.biasF32[1024]
-
blk.2.attn_v.weightQ3_K[8192 1024]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.2.ffn_up.weightQ3_K[8192 29568]
-
blk.2.ffn_norm.weightF32[8192]
-
blk.3.ffn_gate.weightQ3_K[8192 29568]
-
blk.3.ffn_up.weightQ3_K[8192 29568]
-
blk.3.attn_k.biasF32[1024]
-
blk.3.attn_k.weightQ3_K[8192 1024]
-
blk.3.attn_output.weightQ3_K[8192 8192]
-
blk.3.attn_q.biasF32[8192]
-
blk.3.attn_q.weightQ3_K[8192 8192]
-
blk.3.attn_v.biasF32[1024]
-
blk.3.attn_v.weightQ3_K[8192 1024]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.3.ffn_norm.weightF32[8192]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.4.ffn_gate.weightQ3_K[8192 29568]
-
blk.4.ffn_up.weightQ3_K[8192 29568]
-
blk.4.ffn_norm.weightF32[8192]
-
blk.4.attn_k.biasF32[1024]
-
blk.4.attn_k.weightQ3_K[8192 1024]
-
blk.4.attn_output.weightQ3_K[8192 8192]
-
blk.4.attn_q.biasF32[8192]
-
blk.4.attn_q.weightQ3_K[8192 8192]
-
blk.4.attn_v.biasF32[1024]
-
blk.4.attn_v.weightQ3_K[8192 1024]
-
blk.5.attn_k.biasF32[1024]
-
blk.5.attn_k.weightQ3_K[8192 1024]
-
blk.5.attn_q.biasF32[8192]
-
blk.5.attn_q.weightQ3_K[8192 8192]
-
blk.5.attn_v.biasF32[1024]
-
blk.5.attn_v.weightQ3_K[8192 1024]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.5.ffn_gate.weightQ3_K[8192 29568]
-
blk.5.ffn_up.weightQ3_K[8192 29568]
-
blk.5.ffn_norm.weightF32[8192]
-
blk.5.attn_output.weightQ3_K[8192 8192]
-
blk.6.ffn_gate.weightQ3_K[8192 29568]
-
blk.6.attn_k.biasF32[1024]
-
blk.6.attn_k.weightQ3_K[8192 1024]
-
blk.6.attn_output.weightQ3_K[8192 8192]
-
blk.6.attn_q.biasF32[8192]
-
blk.6.attn_q.weightQ3_K[8192 8192]
-
blk.6.attn_v.biasF32[1024]
-
blk.6.attn_v.weightQ3_K[8192 1024]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.6.ffn_up.weightQ3_K[8192 29568]
-
blk.6.ffn_norm.weightF32[8192]
-
blk.7.ffn_gate.weightQ3_K[8192 29568]
-
blk.7.ffn_up.weightQ3_K[8192 29568]
-
blk.7.attn_k.biasF32[1024]
-
blk.7.attn_k.weightQ3_K[8192 1024]
-
blk.7.attn_output.weightQ3_K[8192 8192]
-
blk.7.attn_q.biasF32[8192]
-
blk.7.attn_q.weightQ3_K[8192 8192]
-
blk.7.attn_v.biasF32[1024]
-
blk.7.attn_v.weightQ3_K[8192 1024]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.7.ffn_norm.weightF32[8192]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.8.ffn_gate.weightQ3_K[8192 29568]
-
blk.8.ffn_up.weightQ3_K[8192 29568]
-
blk.8.ffn_norm.weightF32[8192]
-
blk.8.attn_k.biasF32[1024]
-
blk.8.attn_k.weightQ3_K[8192 1024]
-
blk.8.attn_output.weightQ3_K[8192 8192]
-
blk.8.attn_q.biasF32[8192]
-
blk.8.attn_q.weightQ3_K[8192 8192]
-
blk.8.attn_v.biasF32[1024]
-
blk.8.attn_v.weightQ3_K[8192 1024]
-
blk.9.attn_k.biasF32[1024]
-
blk.9.attn_k.weightQ3_K[8192 1024]
-
blk.9.attn_q.biasF32[8192]
-
blk.9.attn_q.weightQ3_K[8192 8192]
-
blk.9.attn_v.biasF32[1024]
-
blk.9.attn_v.weightQ3_K[8192 1024]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.9.ffn_gate.weightQ3_K[8192 29568]
-
blk.9.ffn_up.weightQ3_K[8192 29568]
-
blk.9.ffn_norm.weightF32[8192]
-
blk.9.attn_output.weightQ3_K[8192 8192]
-
blk.10.ffn_gate.weightQ3_K[8192 29568]
-
blk.10.attn_k.biasF32[1024]
-
blk.10.attn_k.weightQ3_K[8192 1024]
-
blk.10.attn_output.weightQ3_K[8192 8192]
-
blk.10.attn_q.biasF32[8192]
-
blk.10.attn_q.weightQ3_K[8192 8192]
-
blk.10.attn_v.biasF32[1024]
-
blk.10.attn_v.weightQ3_K[8192 1024]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.10.ffn_up.weightQ3_K[8192 29568]
-
blk.10.ffn_norm.weightF32[8192]
-
blk.11.ffn_gate.weightQ3_K[8192 29568]
-
blk.11.ffn_up.weightQ3_K[8192 29568]
-
blk.11.attn_k.biasF32[1024]
-
blk.11.attn_k.weightQ3_K[8192 1024]
-
blk.11.attn_output.weightQ3_K[8192 8192]
-
blk.11.attn_q.biasF32[8192]
-
blk.11.attn_q.weightQ3_K[8192 8192]
-
blk.11.attn_v.biasF32[1024]
-
blk.11.attn_v.weightQ3_K[8192 1024]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.11.ffn_norm.weightF32[8192]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.12.ffn_gate.weightQ3_K[8192 29568]
-
blk.12.ffn_up.weightQ3_K[8192 29568]
-
blk.12.ffn_norm.weightF32[8192]
-
blk.12.attn_k.biasF32[1024]
-
blk.12.attn_k.weightQ3_K[8192 1024]
-
blk.12.attn_output.weightQ3_K[8192 8192]
-
blk.12.attn_q.biasF32[8192]
-
blk.12.attn_q.weightQ3_K[8192 8192]
-
blk.12.attn_v.biasF32[1024]
-
blk.12.attn_v.weightQ3_K[8192 1024]
-
blk.13.attn_k.biasF32[1024]
-
blk.13.attn_k.weightQ3_K[8192 1024]
-
blk.13.attn_q.biasF32[8192]
-
blk.13.attn_q.weightQ3_K[8192 8192]
-
blk.13.attn_v.biasF32[1024]
-
blk.13.attn_v.weightQ3_K[8192 1024]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.13.ffn_gate.weightQ3_K[8192 29568]
-
blk.13.ffn_up.weightQ3_K[8192 29568]
-
blk.13.ffn_norm.weightF32[8192]
-
blk.13.attn_output.weightQ3_K[8192 8192]
-
blk.14.ffn_gate.weightQ3_K[8192 29568]
-
blk.14.attn_k.biasF32[1024]
-
blk.14.attn_k.weightQ3_K[8192 1024]
-
blk.14.attn_output.weightQ3_K[8192 8192]
-
blk.14.attn_q.biasF32[8192]
-
blk.14.attn_q.weightQ3_K[8192 8192]
-
blk.14.attn_v.biasF32[1024]
-
blk.14.attn_v.weightQ3_K[8192 1024]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.14.ffn_up.weightQ3_K[8192 29568]
-
blk.14.ffn_norm.weightF32[8192]
-
blk.15.ffn_gate.weightQ3_K[8192 29568]
-
blk.15.ffn_up.weightQ3_K[8192 29568]
-
blk.15.attn_k.biasF32[1024]
-
blk.15.attn_k.weightQ3_K[8192 1024]
-
blk.15.attn_output.weightQ3_K[8192 8192]
-
blk.15.attn_q.biasF32[8192]
-
blk.15.attn_q.weightQ3_K[8192 8192]
-
blk.15.attn_v.biasF32[1024]
-
blk.15.attn_v.weightQ3_K[8192 1024]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.15.ffn_norm.weightF32[8192]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.16.ffn_gate.weightQ3_K[8192 29568]
-
blk.16.ffn_up.weightQ3_K[8192 29568]
-
blk.16.ffn_norm.weightF32[8192]
-
blk.16.attn_k.biasF32[1024]
-
blk.16.attn_k.weightQ3_K[8192 1024]
-
blk.16.attn_output.weightQ3_K[8192 8192]
-
blk.16.attn_q.biasF32[8192]
-
blk.16.attn_q.weightQ3_K[8192 8192]
-
blk.16.attn_v.biasF32[1024]
-
blk.16.attn_v.weightQ3_K[8192 1024]
-
blk.17.attn_k.biasF32[1024]
-
blk.17.attn_k.weightQ3_K[8192 1024]
-
blk.17.attn_q.biasF32[8192]
-
blk.17.attn_q.weightQ3_K[8192 8192]
-
blk.17.attn_v.biasF32[1024]
-
blk.17.attn_v.weightQ3_K[8192 1024]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.17.ffn_gate.weightQ3_K[8192 29568]
-
blk.17.ffn_up.weightQ3_K[8192 29568]
-
blk.17.ffn_norm.weightF32[8192]
-
blk.17.attn_output.weightQ3_K[8192 8192]
-
blk.18.ffn_gate.weightQ3_K[8192 29568]
-
blk.18.attn_k.biasF32[1024]
-
blk.18.attn_k.weightQ3_K[8192 1024]
-
blk.18.attn_output.weightQ3_K[8192 8192]
-
blk.18.attn_q.biasF32[8192]
-
blk.18.attn_q.weightQ3_K[8192 8192]
-
blk.18.attn_v.biasF32[1024]
-
blk.18.attn_v.weightQ3_K[8192 1024]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.18.ffn_up.weightQ3_K[8192 29568]
-
blk.18.ffn_norm.weightF32[8192]
-
blk.19.ffn_gate.weightQ3_K[8192 29568]
-
blk.19.ffn_up.weightQ3_K[8192 29568]
-
blk.19.attn_k.biasF32[1024]
-
blk.19.attn_k.weightQ3_K[8192 1024]
-
blk.19.attn_output.weightQ3_K[8192 8192]
-
blk.19.attn_q.biasF32[8192]
-
blk.19.attn_q.weightQ3_K[8192 8192]
-
blk.19.attn_v.biasF32[1024]
-
blk.19.attn_v.weightQ3_K[8192 1024]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.19.ffn_norm.weightF32[8192]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.20.ffn_gate.weightQ3_K[8192 29568]
-
blk.20.ffn_up.weightQ3_K[8192 29568]
-
blk.20.ffn_norm.weightF32[8192]
-
blk.20.attn_k.biasF32[1024]
-
blk.20.attn_k.weightQ3_K[8192 1024]
-
blk.20.attn_output.weightQ3_K[8192 8192]
-
blk.20.attn_q.biasF32[8192]
-
blk.20.attn_q.weightQ3_K[8192 8192]
-
blk.20.attn_v.biasF32[1024]
-
blk.20.attn_v.weightQ3_K[8192 1024]
-
blk.21.attn_k.biasF32[1024]
-
blk.21.attn_k.weightQ3_K[8192 1024]
-
blk.21.attn_q.biasF32[8192]
-
blk.21.attn_q.weightQ3_K[8192 8192]
-
blk.21.attn_v.biasF32[1024]
-
blk.21.attn_v.weightQ3_K[8192 1024]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.21.ffn_gate.weightQ3_K[8192 29568]
-
blk.21.ffn_up.weightQ3_K[8192 29568]
-
blk.21.ffn_norm.weightF32[8192]
-
blk.21.attn_output.weightQ3_K[8192 8192]
-
blk.22.ffn_gate.weightQ3_K[8192 29568]
-
blk.22.attn_k.biasF32[1024]
-
blk.22.attn_k.weightQ3_K[8192 1024]
-
blk.22.attn_output.weightQ3_K[8192 8192]
-
blk.22.attn_q.biasF32[8192]
-
blk.22.attn_q.weightQ3_K[8192 8192]
-
blk.22.attn_v.biasF32[1024]
-
blk.22.attn_v.weightQ3_K[8192 1024]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.22.ffn_up.weightQ3_K[8192 29568]
-
blk.22.ffn_norm.weightF32[8192]
-
blk.23.ffn_gate.weightQ3_K[8192 29568]
-
blk.23.ffn_up.weightQ3_K[8192 29568]
-
blk.23.attn_k.biasF32[1024]
-
blk.23.attn_k.weightQ3_K[8192 1024]
-
blk.23.attn_output.weightQ3_K[8192 8192]
-
blk.23.attn_q.biasF32[8192]
-
blk.23.attn_q.weightQ3_K[8192 8192]
-
blk.23.attn_v.biasF32[1024]
-
blk.23.attn_v.weightQ3_K[8192 1024]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.23.ffn_norm.weightF32[8192]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.24.ffn_gate.weightQ3_K[8192 29568]
-
blk.24.ffn_up.weightQ3_K[8192 29568]
-
blk.24.ffn_norm.weightF32[8192]
-
blk.24.attn_k.biasF32[1024]
-
blk.24.attn_k.weightQ3_K[8192 1024]
-
blk.24.attn_output.weightQ3_K[8192 8192]
-
blk.24.attn_q.biasF32[8192]
-
blk.24.attn_q.weightQ3_K[8192 8192]
-
blk.24.attn_v.biasF32[1024]
-
blk.24.attn_v.weightQ3_K[8192 1024]
-
blk.25.attn_k.biasF32[1024]
-
blk.25.attn_k.weightQ3_K[8192 1024]
-
blk.25.attn_q.biasF32[8192]
-
blk.25.attn_q.weightQ3_K[8192 8192]
-
blk.25.attn_v.biasF32[1024]
-
blk.25.attn_v.weightQ3_K[8192 1024]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.25.ffn_gate.weightQ3_K[8192 29568]
-
blk.25.ffn_up.weightQ3_K[8192 29568]
-
blk.25.ffn_norm.weightF32[8192]
-
blk.25.attn_output.weightQ3_K[8192 8192]
-
blk.26.ffn_gate.weightQ3_K[8192 29568]
-
blk.26.attn_k.biasF32[1024]
-
blk.26.attn_k.weightQ3_K[8192 1024]
-
blk.26.attn_output.weightQ3_K[8192 8192]
-
blk.26.attn_q.biasF32[8192]
-
blk.26.attn_q.weightQ3_K[8192 8192]
-
blk.26.attn_v.biasF32[1024]
-
blk.26.attn_v.weightQ3_K[8192 1024]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.26.ffn_up.weightQ3_K[8192 29568]
-
blk.26.ffn_norm.weightF32[8192]
-
blk.27.ffn_gate.weightQ3_K[8192 29568]
-
blk.27.ffn_up.weightQ3_K[8192 29568]
-
blk.27.attn_k.biasF32[1024]
-
blk.27.attn_k.weightQ3_K[8192 1024]
-
blk.27.attn_output.weightQ3_K[8192 8192]
-
blk.27.attn_q.biasF32[8192]
-
blk.27.attn_q.weightQ3_K[8192 8192]
-
blk.27.attn_v.biasF32[1024]
-
blk.27.attn_v.weightQ3_K[8192 1024]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.27.ffn_norm.weightF32[8192]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.28.ffn_gate.weightQ3_K[8192 29568]
-
blk.28.ffn_up.weightQ3_K[8192 29568]
-
blk.28.ffn_norm.weightF32[8192]
-
blk.28.attn_k.biasF32[1024]
-
blk.28.attn_k.weightQ3_K[8192 1024]
-
blk.28.attn_output.weightQ3_K[8192 8192]
-
blk.28.attn_q.biasF32[8192]
-
blk.28.attn_q.weightQ3_K[8192 8192]
-
blk.28.attn_v.biasF32[1024]
-
blk.28.attn_v.weightQ3_K[8192 1024]
-
blk.29.attn_k.biasF32[1024]
-
blk.29.attn_k.weightQ3_K[8192 1024]
-
blk.29.attn_q.biasF32[8192]
-
blk.29.attn_q.weightQ3_K[8192 8192]
-
blk.29.attn_v.biasF32[1024]
-
blk.29.attn_v.weightQ3_K[8192 1024]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.29.ffn_gate.weightQ3_K[8192 29568]
-
blk.29.ffn_up.weightQ3_K[8192 29568]
-
blk.29.ffn_norm.weightF32[8192]
-
blk.29.attn_output.weightQ3_K[8192 8192]
-
blk.30.ffn_gate.weightQ3_K[8192 29568]
-
blk.30.attn_k.biasF32[1024]
-
blk.30.attn_k.weightQ3_K[8192 1024]
-
blk.30.attn_output.weightQ3_K[8192 8192]
-
blk.30.attn_q.biasF32[8192]
-
blk.30.attn_q.weightQ3_K[8192 8192]
-
blk.30.attn_v.biasF32[1024]
-
blk.30.attn_v.weightQ3_K[8192 1024]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.30.ffn_up.weightQ3_K[8192 29568]
-
blk.30.ffn_norm.weightF32[8192]
-
blk.31.ffn_gate.weightQ3_K[8192 29568]
-
blk.31.ffn_up.weightQ3_K[8192 29568]
-
blk.31.attn_k.biasF32[1024]
-
blk.31.attn_k.weightQ3_K[8192 1024]
-
blk.31.attn_output.weightQ3_K[8192 8192]
-
blk.31.attn_q.biasF32[8192]
-
blk.31.attn_q.weightQ3_K[8192 8192]
-
blk.31.attn_v.biasF32[1024]
-
blk.31.attn_v.weightQ3_K[8192 1024]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.31.ffn_norm.weightF32[8192]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.32.ffn_gate.weightQ3_K[8192 29568]
-
blk.32.ffn_up.weightQ3_K[8192 29568]
-
blk.32.ffn_norm.weightF32[8192]
-
blk.32.attn_k.biasF32[1024]
-
blk.32.attn_k.weightQ3_K[8192 1024]
-
blk.32.attn_output.weightQ3_K[8192 8192]
-
blk.32.attn_q.biasF32[8192]
-
blk.32.attn_q.weightQ3_K[8192 8192]
-
blk.32.attn_v.biasF32[1024]
-
blk.32.attn_v.weightQ3_K[8192 1024]
-
blk.33.attn_k.biasF32[1024]
-
blk.33.attn_k.weightQ3_K[8192 1024]
-
blk.33.attn_q.biasF32[8192]
-
blk.33.attn_q.weightQ3_K[8192 8192]
-
blk.33.attn_v.biasF32[1024]
-
blk.33.attn_v.weightQ3_K[8192 1024]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.33.ffn_gate.weightQ3_K[8192 29568]
-
blk.33.ffn_up.weightQ3_K[8192 29568]
-
blk.33.ffn_norm.weightF32[8192]
-
blk.33.attn_output.weightQ3_K[8192 8192]
-
blk.34.ffn_gate.weightQ3_K[8192 29568]
-
blk.34.attn_k.biasF32[1024]
-
blk.34.attn_k.weightQ3_K[8192 1024]
-
blk.34.attn_output.weightQ3_K[8192 8192]
-
blk.34.attn_q.biasF32[8192]
-
blk.34.attn_q.weightQ3_K[8192 8192]
-
blk.34.attn_v.biasF32[1024]
-
blk.34.attn_v.weightQ3_K[8192 1024]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.34.ffn_up.weightQ3_K[8192 29568]
-
blk.34.ffn_norm.weightF32[8192]
-
blk.35.ffn_gate.weightQ3_K[8192 29568]
-
blk.35.ffn_up.weightQ3_K[8192 29568]
-
blk.35.attn_k.biasF32[1024]
-
blk.35.attn_k.weightQ3_K[8192 1024]
-
blk.35.attn_output.weightQ3_K[8192 8192]
-
blk.35.attn_q.biasF32[8192]
-
blk.35.attn_q.weightQ3_K[8192 8192]
-
blk.35.attn_v.biasF32[1024]
-
blk.35.attn_v.weightQ3_K[8192 1024]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.35.ffn_norm.weightF32[8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.36.ffn_gate.weightQ3_K[8192 29568]
-
blk.36.ffn_up.weightQ3_K[8192 29568]
-
blk.36.ffn_norm.weightF32[8192]
-
blk.36.attn_k.biasF32[1024]
-
blk.36.attn_k.weightQ3_K[8192 1024]
-
blk.36.attn_output.weightQ3_K[8192 8192]
-
blk.36.attn_q.biasF32[8192]
-
blk.36.attn_q.weightQ3_K[8192 8192]
-
blk.36.attn_v.biasF32[1024]
-
blk.36.attn_v.weightQ3_K[8192 1024]
-
blk.37.attn_k.biasF32[1024]
-
blk.37.attn_k.weightQ3_K[8192 1024]
-
blk.37.attn_q.biasF32[8192]
-
blk.37.attn_q.weightQ3_K[8192 8192]
-
blk.37.attn_v.biasF32[1024]
-
blk.37.attn_v.weightQ3_K[8192 1024]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.37.ffn_gate.weightQ3_K[8192 29568]
-
blk.37.ffn_up.weightQ3_K[8192 29568]
-
blk.37.ffn_norm.weightF32[8192]
-
blk.37.attn_output.weightQ3_K[8192 8192]
-
blk.38.ffn_gate.weightQ3_K[8192 29568]
-
blk.38.attn_k.biasF32[1024]
-
blk.38.attn_k.weightQ3_K[8192 1024]
-
blk.38.attn_output.weightQ3_K[8192 8192]
-
blk.38.attn_q.biasF32[8192]
-
blk.38.attn_q.weightQ3_K[8192 8192]
-
blk.38.attn_v.biasF32[1024]
-
blk.38.attn_v.weightQ3_K[8192 1024]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.38.ffn_up.weightQ3_K[8192 29568]
-
blk.38.ffn_norm.weightF32[8192]
-
blk.39.ffn_gate.weightQ3_K[8192 29568]
-
blk.39.ffn_up.weightQ3_K[8192 29568]
-
blk.39.attn_k.biasF32[1024]
-
blk.39.attn_k.weightQ3_K[8192 1024]
-
blk.39.attn_output.weightQ3_K[8192 8192]
-
blk.39.attn_q.biasF32[8192]
-
blk.39.attn_q.weightQ3_K[8192 8192]
-
blk.39.attn_v.biasF32[1024]
-
blk.39.attn_v.weightQ3_K[8192 1024]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.39.ffn_norm.weightF32[8192]
-
blk.40.attn_norm.weightF32[8192]
-
blk.40.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.40.ffn_gate.weightQ3_K[8192 29568]
-
blk.40.ffn_up.weightQ3_K[8192 29568]
-
blk.40.ffn_norm.weightF32[8192]
-
blk.40.attn_k.biasF32[1024]
-
blk.40.attn_k.weightQ3_K[8192 1024]
-
blk.40.attn_output.weightQ3_K[8192 8192]
-
blk.40.attn_q.biasF32[8192]
-
blk.40.attn_q.weightQ3_K[8192 8192]
-
blk.40.attn_v.biasF32[1024]
-
blk.40.attn_v.weightQ3_K[8192 1024]
-
blk.41.attn_k.biasF32[1024]
-
blk.41.attn_k.weightQ3_K[8192 1024]
-
blk.41.attn_q.biasF32[8192]
-
blk.41.attn_q.weightQ3_K[8192 8192]
-
blk.41.attn_v.biasF32[1024]
-
blk.41.attn_v.weightQ3_K[8192 1024]
-
blk.41.attn_norm.weightF32[8192]
-
blk.41.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.41.ffn_gate.weightQ3_K[8192 29568]
-
blk.41.ffn_up.weightQ3_K[8192 29568]
-
blk.41.ffn_norm.weightF32[8192]
-
blk.41.attn_output.weightQ3_K[8192 8192]
-
blk.42.ffn_gate.weightQ3_K[8192 29568]
-
blk.42.attn_k.biasF32[1024]
-
blk.42.attn_k.weightQ3_K[8192 1024]
-
blk.42.attn_output.weightQ3_K[8192 8192]
-
blk.42.attn_q.biasF32[8192]
-
blk.42.attn_q.weightQ3_K[8192 8192]
-
blk.42.attn_v.biasF32[1024]
-
blk.42.attn_v.weightQ3_K[8192 1024]
-
blk.42.attn_norm.weightF32[8192]
-
blk.42.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.42.ffn_up.weightQ3_K[8192 29568]
-
blk.42.ffn_norm.weightF32[8192]
-
blk.43.ffn_gate.weightQ3_K[8192 29568]
-
blk.43.ffn_up.weightQ3_K[8192 29568]
-
blk.43.attn_k.biasF32[1024]
-
blk.43.attn_k.weightQ3_K[8192 1024]
-
blk.43.attn_output.weightQ3_K[8192 8192]
-
blk.43.attn_q.biasF32[8192]
-
blk.43.attn_q.weightQ3_K[8192 8192]
-
blk.43.attn_v.biasF32[1024]
-
blk.43.attn_v.weightQ3_K[8192 1024]
-
blk.43.attn_norm.weightF32[8192]
-
blk.43.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.43.ffn_norm.weightF32[8192]
-
blk.44.attn_norm.weightF32[8192]
-
blk.44.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.44.ffn_gate.weightQ3_K[8192 29568]
-
blk.44.ffn_up.weightQ3_K[8192 29568]
-
blk.44.ffn_norm.weightF32[8192]
-
blk.44.attn_k.biasF32[1024]
-
blk.44.attn_k.weightQ3_K[8192 1024]
-
blk.44.attn_output.weightQ3_K[8192 8192]
-
blk.44.attn_q.biasF32[8192]
-
blk.44.attn_q.weightQ3_K[8192 8192]
-
blk.44.attn_v.biasF32[1024]
-
blk.44.attn_v.weightQ3_K[8192 1024]
-
blk.45.attn_k.biasF32[1024]
-
blk.45.attn_k.weightQ3_K[8192 1024]
-
blk.45.attn_q.biasF32[8192]
-
blk.45.attn_q.weightQ3_K[8192 8192]
-
blk.45.attn_v.biasF32[1024]
-
blk.45.attn_v.weightQ3_K[8192 1024]
-
blk.45.attn_norm.weightF32[8192]
-
blk.45.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.45.ffn_gate.weightQ3_K[8192 29568]
-
blk.45.ffn_up.weightQ3_K[8192 29568]
-
blk.45.ffn_norm.weightF32[8192]
-
blk.45.attn_output.weightQ3_K[8192 8192]
-
blk.46.ffn_gate.weightQ3_K[8192 29568]
-
blk.46.attn_k.biasF32[1024]
-
blk.46.attn_k.weightQ3_K[8192 1024]
-
blk.46.attn_output.weightQ3_K[8192 8192]
-
blk.46.attn_q.biasF32[8192]
-
blk.46.attn_q.weightQ3_K[8192 8192]
-
blk.46.attn_v.biasF32[1024]
-
blk.46.attn_v.weightQ3_K[8192 1024]
-
blk.46.attn_norm.weightF32[8192]
-
blk.46.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.46.ffn_up.weightQ3_K[8192 29568]
-
blk.46.ffn_norm.weightF32[8192]
-
blk.47.ffn_gate.weightQ3_K[8192 29568]
-
blk.47.ffn_up.weightQ3_K[8192 29568]
-
blk.47.attn_k.biasF32[1024]
-
blk.47.attn_k.weightQ3_K[8192 1024]
-
blk.47.attn_output.weightQ3_K[8192 8192]
-
blk.47.attn_q.biasF32[8192]
-
blk.47.attn_q.weightQ3_K[8192 8192]
-
blk.47.attn_v.biasF32[1024]
-
blk.47.attn_v.weightQ3_K[8192 1024]
-
blk.47.attn_norm.weightF32[8192]
-
blk.47.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.47.ffn_norm.weightF32[8192]
-
blk.48.attn_norm.weightF32[8192]
-
blk.48.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.48.ffn_gate.weightQ3_K[8192 29568]
-
blk.48.ffn_up.weightQ3_K[8192 29568]
-
blk.48.ffn_norm.weightF32[8192]
-
blk.48.attn_k.biasF32[1024]
-
blk.48.attn_k.weightQ3_K[8192 1024]
-
blk.48.attn_output.weightQ3_K[8192 8192]
-
blk.48.attn_q.biasF32[8192]
-
blk.48.attn_q.weightQ3_K[8192 8192]
-
blk.48.attn_v.biasF32[1024]
-
blk.48.attn_v.weightQ3_K[8192 1024]
-
blk.49.attn_k.biasF32[1024]
-
blk.49.attn_k.weightQ3_K[8192 1024]
-
blk.49.attn_q.biasF32[8192]
-
blk.49.attn_q.weightQ3_K[8192 8192]
-
blk.49.attn_v.biasF32[1024]
-
blk.49.attn_v.weightQ3_K[8192 1024]
-
blk.49.attn_norm.weightF32[8192]
-
blk.49.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.49.ffn_gate.weightQ3_K[8192 29568]
-
blk.49.ffn_up.weightQ3_K[8192 29568]
-
blk.49.ffn_norm.weightF32[8192]
-
blk.49.attn_output.weightQ3_K[8192 8192]
-
blk.50.ffn_gate.weightQ3_K[8192 29568]
-
blk.50.attn_k.biasF32[1024]
-
blk.50.attn_k.weightQ3_K[8192 1024]
-
blk.50.attn_output.weightQ3_K[8192 8192]
-
blk.50.attn_q.biasF32[8192]
-
blk.50.attn_q.weightQ3_K[8192 8192]
-
blk.50.attn_v.biasF32[1024]
-
blk.50.attn_v.weightQ3_K[8192 1024]
-
blk.50.attn_norm.weightF32[8192]
-
blk.50.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.50.ffn_up.weightQ3_K[8192 29568]
-
blk.50.ffn_norm.weightF32[8192]
-
blk.51.ffn_gate.weightQ3_K[8192 29568]
-
blk.51.ffn_up.weightQ3_K[8192 29568]
-
blk.51.attn_k.biasF32[1024]
-
blk.51.attn_k.weightQ3_K[8192 1024]
-
blk.51.attn_output.weightQ3_K[8192 8192]
-
blk.51.attn_q.biasF32[8192]
-
blk.51.attn_q.weightQ3_K[8192 8192]
-
blk.51.attn_v.biasF32[1024]
-
blk.51.attn_v.weightQ3_K[8192 1024]
-
blk.51.attn_norm.weightF32[8192]
-
blk.51.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.51.ffn_norm.weightF32[8192]
-
blk.52.attn_norm.weightF32[8192]
-
blk.52.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.52.ffn_gate.weightQ3_K[8192 29568]
-
blk.52.ffn_up.weightQ3_K[8192 29568]
-
blk.52.ffn_norm.weightF32[8192]
-
blk.52.attn_k.biasF32[1024]
-
blk.52.attn_k.weightQ3_K[8192 1024]
-
blk.52.attn_output.weightQ3_K[8192 8192]
-
blk.52.attn_q.biasF32[8192]
-
blk.52.attn_q.weightQ3_K[8192 8192]
-
blk.52.attn_v.biasF32[1024]
-
blk.52.attn_v.weightQ3_K[8192 1024]
-
blk.53.attn_k.biasF32[1024]
-
blk.53.attn_k.weightQ3_K[8192 1024]
-
blk.53.attn_q.biasF32[8192]
-
blk.53.attn_q.weightQ3_K[8192 8192]
-
blk.53.attn_v.biasF32[1024]
-
blk.53.attn_v.weightQ3_K[8192 1024]
-
blk.53.attn_norm.weightF32[8192]
-
blk.53.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.53.ffn_gate.weightQ3_K[8192 29568]
-
blk.53.ffn_up.weightQ3_K[8192 29568]
-
blk.53.ffn_norm.weightF32[8192]
-
blk.53.attn_output.weightQ3_K[8192 8192]
-
blk.54.ffn_gate.weightQ3_K[8192 29568]
-
blk.54.attn_k.biasF32[1024]
-
blk.54.attn_k.weightQ3_K[8192 1024]
-
blk.54.attn_output.weightQ3_K[8192 8192]
-
blk.54.attn_q.biasF32[8192]
-
blk.54.attn_q.weightQ3_K[8192 8192]
-
blk.54.attn_v.biasF32[1024]
-
blk.54.attn_v.weightQ3_K[8192 1024]
-
blk.54.attn_norm.weightF32[8192]
-
blk.54.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.54.ffn_up.weightQ3_K[8192 29568]
-
blk.54.ffn_norm.weightF32[8192]
-
blk.55.ffn_gate.weightQ3_K[8192 29568]
-
blk.55.ffn_up.weightQ3_K[8192 29568]
-
blk.55.attn_k.biasF32[1024]
-
blk.55.attn_k.weightQ3_K[8192 1024]
-
blk.55.attn_output.weightQ3_K[8192 8192]
-
blk.55.attn_q.biasF32[8192]
-
blk.55.attn_q.weightQ3_K[8192 8192]
-
blk.55.attn_v.biasF32[1024]
-
blk.55.attn_v.weightQ3_K[8192 1024]
-
blk.55.attn_norm.weightF32[8192]
-
blk.55.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.55.ffn_norm.weightF32[8192]
-
blk.56.attn_norm.weightF32[8192]
-
blk.56.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.56.ffn_gate.weightQ3_K[8192 29568]
-
blk.56.ffn_up.weightQ3_K[8192 29568]
-
blk.56.ffn_norm.weightF32[8192]
-
blk.56.attn_k.biasF32[1024]
-
blk.56.attn_k.weightQ3_K[8192 1024]
-
blk.56.attn_output.weightQ3_K[8192 8192]
-
blk.56.attn_q.biasF32[8192]
-
blk.56.attn_q.weightQ3_K[8192 8192]
-
blk.56.attn_v.biasF32[1024]
-
blk.56.attn_v.weightQ3_K[8192 1024]
-
blk.57.attn_k.biasF32[1024]
-
blk.57.attn_k.weightQ3_K[8192 1024]
-
blk.57.attn_q.biasF32[8192]
-
blk.57.attn_q.weightQ3_K[8192 8192]
-
blk.57.attn_v.biasF32[1024]
-
blk.57.attn_v.weightQ3_K[8192 1024]
-
blk.57.attn_norm.weightF32[8192]
-
blk.57.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.57.ffn_gate.weightQ3_K[8192 29568]
-
blk.57.ffn_up.weightQ3_K[8192 29568]
-
blk.57.ffn_norm.weightF32[8192]
-
blk.57.attn_output.weightQ3_K[8192 8192]
-
blk.58.ffn_gate.weightQ3_K[8192 29568]
-
blk.58.attn_k.biasF32[1024]
-
blk.58.attn_k.weightQ3_K[8192 1024]
-
blk.58.attn_output.weightQ3_K[8192 8192]
-
blk.58.attn_q.biasF32[8192]
-
blk.58.attn_q.weightQ3_K[8192 8192]
-
blk.58.attn_v.biasF32[1024]
-
blk.58.attn_v.weightQ3_K[8192 1024]
-
blk.58.attn_norm.weightF32[8192]
-
blk.58.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.58.ffn_up.weightQ3_K[8192 29568]
-
blk.58.ffn_norm.weightF32[8192]
-
blk.59.ffn_gate.weightQ3_K[8192 29568]
-
blk.59.ffn_up.weightQ3_K[8192 29568]
-
blk.59.attn_k.biasF32[1024]
-
blk.59.attn_k.weightQ3_K[8192 1024]
-
blk.59.attn_output.weightQ3_K[8192 8192]
-
blk.59.attn_q.biasF32[8192]
-
blk.59.attn_q.weightQ3_K[8192 8192]
-
blk.59.attn_v.biasF32[1024]
-
blk.59.attn_v.weightQ3_K[8192 1024]
-
blk.59.attn_norm.weightF32[8192]
-
blk.59.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.59.ffn_norm.weightF32[8192]
-
blk.60.attn_norm.weightF32[8192]
-
blk.60.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.60.ffn_gate.weightQ3_K[8192 29568]
-
blk.60.ffn_up.weightQ3_K[8192 29568]
-
blk.60.ffn_norm.weightF32[8192]
-
blk.60.attn_k.biasF32[1024]
-
blk.60.attn_k.weightQ3_K[8192 1024]
-
blk.60.attn_output.weightQ3_K[8192 8192]
-
blk.60.attn_q.biasF32[8192]
-
blk.60.attn_q.weightQ3_K[8192 8192]
-
blk.60.attn_v.biasF32[1024]
-
blk.60.attn_v.weightQ3_K[8192 1024]
-
blk.61.attn_k.biasF32[1024]
-
blk.61.attn_k.weightQ3_K[8192 1024]
-
blk.61.attn_q.biasF32[8192]
-
blk.61.attn_q.weightQ3_K[8192 8192]
-
blk.61.attn_v.biasF32[1024]
-
blk.61.attn_v.weightQ3_K[8192 1024]
-
blk.61.attn_norm.weightF32[8192]
-
blk.61.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.61.ffn_gate.weightQ3_K[8192 29568]
-
blk.61.ffn_up.weightQ3_K[8192 29568]
-
blk.61.ffn_norm.weightF32[8192]
-
blk.61.attn_output.weightQ3_K[8192 8192]
-
blk.62.ffn_gate.weightQ3_K[8192 29568]
-
blk.62.attn_k.biasF32[1024]
-
blk.62.attn_k.weightQ3_K[8192 1024]
-
blk.62.attn_output.weightQ3_K[8192 8192]
-
blk.62.attn_q.biasF32[8192]
-
blk.62.attn_q.weightQ3_K[8192 8192]
-
blk.62.attn_v.biasF32[1024]
-
blk.62.attn_v.weightQ3_K[8192 1024]
-
blk.62.attn_norm.weightF32[8192]
-
blk.62.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.62.ffn_up.weightQ3_K[8192 29568]
-
blk.62.ffn_norm.weightF32[8192]
-
blk.63.ffn_gate.weightQ3_K[8192 29568]
-
blk.63.ffn_up.weightQ3_K[8192 29568]
-
blk.63.attn_k.biasF32[1024]
-
blk.63.attn_k.weightQ3_K[8192 1024]
-
blk.63.attn_output.weightQ3_K[8192 8192]
-
blk.63.attn_q.biasF32[8192]
-
blk.63.attn_q.weightQ3_K[8192 8192]
-
blk.63.attn_v.biasF32[1024]
-
blk.63.attn_v.weightQ3_K[8192 1024]
-
blk.63.attn_norm.weightF32[8192]
-
blk.63.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.63.ffn_norm.weightF32[8192]
-
blk.64.attn_norm.weightF32[8192]
-
blk.64.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.64.ffn_gate.weightQ3_K[8192 29568]
-
blk.64.ffn_up.weightQ3_K[8192 29568]
-
blk.64.ffn_norm.weightF32[8192]
-
blk.64.attn_k.biasF32[1024]
-
blk.64.attn_k.weightQ3_K[8192 1024]
-
blk.64.attn_output.weightQ3_K[8192 8192]
-
blk.64.attn_q.biasF32[8192]
-
blk.64.attn_q.weightQ3_K[8192 8192]
-
blk.64.attn_v.biasF32[1024]
-
blk.64.attn_v.weightQ3_K[8192 1024]
-
blk.65.attn_k.biasF32[1024]
-
blk.65.attn_k.weightQ3_K[8192 1024]
-
blk.65.attn_q.biasF32[8192]
-
blk.65.attn_q.weightQ3_K[8192 8192]
-
blk.65.attn_v.biasF32[1024]
-
blk.65.attn_v.weightQ3_K[8192 1024]
-
blk.65.attn_norm.weightF32[8192]
-
blk.65.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.65.ffn_gate.weightQ3_K[8192 29568]
-
blk.65.ffn_up.weightQ3_K[8192 29568]
-
blk.65.ffn_norm.weightF32[8192]
-
blk.65.attn_output.weightQ3_K[8192 8192]
-
blk.66.ffn_gate.weightQ3_K[8192 29568]
-
blk.66.attn_k.biasF32[1024]
-
blk.66.attn_k.weightQ3_K[8192 1024]
-
blk.66.attn_output.weightQ3_K[8192 8192]
-
blk.66.attn_q.biasF32[8192]
-
blk.66.attn_q.weightQ3_K[8192 8192]
-
blk.66.attn_v.biasF32[1024]
-
blk.66.attn_v.weightQ3_K[8192 1024]
-
blk.66.attn_norm.weightF32[8192]
-
blk.66.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.66.ffn_up.weightQ3_K[8192 29568]
-
blk.66.ffn_norm.weightF32[8192]
-
blk.67.ffn_gate.weightQ3_K[8192 29568]
-
blk.67.ffn_up.weightQ3_K[8192 29568]
-
blk.67.attn_k.biasF32[1024]
-
blk.67.attn_k.weightQ3_K[8192 1024]
-
blk.67.attn_output.weightQ3_K[8192 8192]
-
blk.67.attn_q.biasF32[8192]
-
blk.67.attn_q.weightQ3_K[8192 8192]
-
blk.67.attn_v.biasF32[1024]
-
blk.67.attn_v.weightQ3_K[8192 1024]
-
blk.67.attn_norm.weightF32[8192]
-
blk.67.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.67.ffn_norm.weightF32[8192]
-
blk.68.attn_norm.weightF32[8192]
-
blk.68.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.68.ffn_gate.weightQ3_K[8192 29568]
-
blk.68.ffn_up.weightQ3_K[8192 29568]
-
blk.68.ffn_norm.weightF32[8192]
-
blk.68.attn_k.biasF32[1024]
-
blk.68.attn_k.weightQ3_K[8192 1024]
-
blk.68.attn_output.weightQ3_K[8192 8192]
-
blk.68.attn_q.biasF32[8192]
-
blk.68.attn_q.weightQ3_K[8192 8192]
-
blk.68.attn_v.biasF32[1024]
-
blk.68.attn_v.weightQ3_K[8192 1024]
-
blk.69.attn_k.biasF32[1024]
-
blk.69.attn_k.weightQ3_K[8192 1024]
-
blk.69.attn_q.biasF32[8192]
-
blk.69.attn_q.weightQ3_K[8192 8192]
-
blk.69.attn_v.biasF32[1024]
-
blk.69.attn_v.weightQ3_K[8192 1024]
-
blk.69.attn_norm.weightF32[8192]
-
blk.69.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.69.ffn_gate.weightQ3_K[8192 29568]
-
blk.69.ffn_up.weightQ3_K[8192 29568]
-
blk.69.ffn_norm.weightF32[8192]
-
blk.69.attn_output.weightQ3_K[8192 8192]
-
blk.70.ffn_gate.weightQ3_K[8192 29568]
-
blk.70.attn_k.biasF32[1024]
-
blk.70.attn_k.weightQ3_K[8192 1024]
-
blk.70.attn_output.weightQ3_K[8192 8192]
-
blk.70.attn_q.biasF32[8192]
-
blk.70.attn_q.weightQ3_K[8192 8192]
-
blk.70.attn_v.biasF32[1024]
-
blk.70.attn_v.weightQ3_K[8192 1024]
-
blk.70.attn_norm.weightF32[8192]
-
blk.70.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.70.ffn_up.weightQ3_K[8192 29568]
-
blk.70.ffn_norm.weightF32[8192]
-
blk.71.ffn_gate.weightQ3_K[8192 29568]
-
blk.71.ffn_up.weightQ3_K[8192 29568]
-
blk.71.attn_k.biasF32[1024]
-
blk.71.attn_k.weightQ3_K[8192 1024]
-
blk.71.attn_output.weightQ3_K[8192 8192]
-
blk.71.attn_q.biasF32[8192]
-
blk.71.attn_q.weightQ3_K[8192 8192]
-
blk.71.attn_v.biasF32[1024]
-
blk.71.attn_v.weightQ3_K[8192 1024]
-
blk.71.attn_norm.weightF32[8192]
-
blk.71.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.71.ffn_norm.weightF32[8192]
-
blk.72.attn_norm.weightF32[8192]
-
blk.72.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.72.ffn_gate.weightQ3_K[8192 29568]
-
blk.72.ffn_up.weightQ3_K[8192 29568]
-
blk.72.ffn_norm.weightF32[8192]
-
blk.72.attn_k.biasF32[1024]
-
blk.72.attn_k.weightQ3_K[8192 1024]
-
blk.72.attn_output.weightQ3_K[8192 8192]
-
blk.72.attn_q.biasF32[8192]
-
blk.72.attn_q.weightQ3_K[8192 8192]
-
blk.72.attn_v.biasF32[1024]
-
blk.72.attn_v.weightQ3_K[8192 1024]
-
blk.73.attn_k.biasF32[1024]
-
blk.73.attn_k.weightQ3_K[8192 1024]
-
blk.73.attn_q.biasF32[8192]
-
blk.73.attn_q.weightQ3_K[8192 8192]
-
blk.73.attn_v.biasF32[1024]
-
blk.73.attn_v.weightQ3_K[8192 1024]
-
blk.73.attn_norm.weightF32[8192]
-
blk.73.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.73.ffn_gate.weightQ3_K[8192 29568]
-
blk.73.ffn_up.weightQ3_K[8192 29568]
-
blk.73.ffn_norm.weightF32[8192]
-
blk.73.attn_output.weightQ3_K[8192 8192]
-
blk.74.ffn_gate.weightQ3_K[8192 29568]
-
blk.74.attn_k.biasF32[1024]
-
blk.74.attn_k.weightQ3_K[8192 1024]
-
blk.74.attn_output.weightQ3_K[8192 8192]
-
blk.74.attn_q.biasF32[8192]
-
blk.74.attn_q.weightQ3_K[8192 8192]
-
blk.74.attn_v.biasF32[1024]
-
blk.74.attn_v.weightQ3_K[8192 1024]
-
blk.74.attn_norm.weightF32[8192]
-
blk.74.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.74.ffn_up.weightQ3_K[8192 29568]
-
blk.74.ffn_norm.weightF32[8192]
-
blk.75.ffn_gate.weightQ3_K[8192 29568]
-
blk.75.ffn_up.weightQ3_K[8192 29568]
-
blk.75.attn_k.biasF32[1024]
-
blk.75.attn_k.weightQ3_K[8192 1024]
-
blk.75.attn_output.weightQ3_K[8192 8192]
-
blk.75.attn_q.biasF32[8192]
-
blk.75.attn_q.weightQ3_K[8192 8192]
-
blk.75.attn_v.biasF32[1024]
-
blk.75.attn_v.weightQ3_K[8192 1024]
-
blk.75.attn_norm.weightF32[8192]
-
blk.75.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.75.ffn_norm.weightF32[8192]
-
blk.76.attn_norm.weightF32[8192]
-
blk.76.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.76.ffn_gate.weightQ3_K[8192 29568]
-
blk.76.ffn_up.weightQ3_K[8192 29568]
-
blk.76.ffn_norm.weightF32[8192]
-
blk.76.attn_k.biasF32[1024]
-
blk.76.attn_k.weightQ3_K[8192 1024]
-
blk.76.attn_output.weightQ3_K[8192 8192]
-
blk.76.attn_q.biasF32[8192]
-
blk.76.attn_q.weightQ3_K[8192 8192]
-
blk.76.attn_v.biasF32[1024]
-
blk.76.attn_v.weightQ3_K[8192 1024]
-
blk.77.attn_k.biasF32[1024]
-
blk.77.attn_k.weightQ3_K[8192 1024]
-
blk.77.attn_q.biasF32[8192]
-
blk.77.attn_q.weightQ3_K[8192 8192]
-
blk.77.attn_v.biasF32[1024]
-
blk.77.attn_v.weightQ3_K[8192 1024]
-
blk.77.attn_norm.weightF32[8192]
-
blk.77.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.77.ffn_gate.weightQ3_K[8192 29568]
-
blk.77.ffn_up.weightQ3_K[8192 29568]
-
blk.77.ffn_norm.weightF32[8192]
-
blk.77.attn_output.weightQ3_K[8192 8192]
-
blk.78.ffn_gate.weightQ3_K[8192 29568]
-
blk.78.attn_k.biasF32[1024]
-
blk.78.attn_k.weightQ3_K[8192 1024]
-
blk.78.attn_output.weightQ3_K[8192 8192]
-
blk.78.attn_q.biasF32[8192]
-
blk.78.attn_q.weightQ3_K[8192 8192]
-
blk.78.attn_v.biasF32[1024]
-
blk.78.attn_v.weightQ3_K[8192 1024]
-
blk.78.attn_norm.weightF32[8192]
-
blk.78.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.78.ffn_up.weightQ3_K[8192 29568]
-
blk.78.ffn_norm.weightF32[8192]
-
blk.79.ffn_gate.weightQ3_K[8192 29568]
-
blk.79.ffn_up.weightQ3_K[8192 29568]
-
blk.79.attn_k.biasF32[1024]
-
blk.79.attn_k.weightQ3_K[8192 1024]
-
blk.79.attn_output.weightQ3_K[8192 8192]
-
blk.79.attn_q.biasF32[8192]
-
blk.79.attn_q.weightQ3_K[8192 8192]
-
blk.79.attn_v.biasF32[1024]
-
blk.79.attn_v.weightQ3_K[8192 1024]
-
blk.79.attn_norm.weightF32[8192]
-
blk.79.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.79.ffn_norm.weightF32[8192]
-
blk.80.attn_norm.weightF32[8192]
-
blk.80.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.80.ffn_gate.weightQ3_K[8192 29568]
-
blk.80.ffn_up.weightQ3_K[8192 29568]
-
blk.80.ffn_norm.weightF32[8192]
-
blk.80.attn_k.biasF32[1024]
-
blk.80.attn_k.weightQ3_K[8192 1024]
-
blk.80.attn_output.weightQ3_K[8192 8192]
-
blk.80.attn_q.biasF32[8192]
-
blk.80.attn_q.weightQ3_K[8192 8192]
-
blk.80.attn_v.biasF32[1024]
-
blk.80.attn_v.weightQ3_K[8192 1024]
-
blk.81.attn_k.biasF32[1024]
-
blk.81.attn_k.weightQ3_K[8192 1024]
-
blk.81.attn_q.biasF32[8192]
-
blk.81.attn_q.weightQ3_K[8192 8192]
-
blk.81.attn_v.biasF32[1024]
-
blk.81.attn_v.weightQ3_K[8192 1024]
-
blk.81.attn_norm.weightF32[8192]
-
blk.81.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.81.ffn_gate.weightQ3_K[8192 29568]
-
blk.81.ffn_up.weightQ3_K[8192 29568]
-
blk.81.ffn_norm.weightF32[8192]
-
blk.81.attn_output.weightQ3_K[8192 8192]
-
blk.82.ffn_gate.weightQ3_K[8192 29568]
-
blk.82.attn_k.biasF32[1024]
-
blk.82.attn_k.weightQ3_K[8192 1024]
-
blk.82.attn_output.weightQ3_K[8192 8192]
-
blk.82.attn_q.biasF32[8192]
-
blk.82.attn_q.weightQ3_K[8192 8192]
-
blk.82.attn_v.biasF32[1024]
-
blk.82.attn_v.weightQ3_K[8192 1024]
-
blk.82.attn_norm.weightF32[8192]
-
blk.82.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.82.ffn_up.weightQ3_K[8192 29568]
-
blk.82.ffn_norm.weightF32[8192]
-
blk.83.ffn_gate.weightQ3_K[8192 29568]
-
blk.83.ffn_up.weightQ3_K[8192 29568]
-
blk.83.attn_k.biasF32[1024]
-
blk.83.attn_k.weightQ3_K[8192 1024]
-
blk.83.attn_output.weightQ3_K[8192 8192]
-
blk.83.attn_q.biasF32[8192]
-
blk.83.attn_q.weightQ3_K[8192 8192]
-
blk.83.attn_v.biasF32[1024]
-
blk.83.attn_v.weightQ3_K[8192 1024]
-
blk.83.attn_norm.weightF32[8192]
-
blk.83.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.83.ffn_norm.weightF32[8192]
-
blk.84.attn_norm.weightF32[8192]
-
blk.84.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.84.ffn_gate.weightQ3_K[8192 29568]
-
blk.84.ffn_up.weightQ3_K[8192 29568]
-
blk.84.ffn_norm.weightF32[8192]
-
blk.84.attn_k.biasF32[1024]
-
blk.84.attn_k.weightQ3_K[8192 1024]
-
blk.84.attn_output.weightQ3_K[8192 8192]
-
blk.84.attn_q.biasF32[8192]
-
blk.84.attn_q.weightQ3_K[8192 8192]
-
blk.84.attn_v.biasF32[1024]
-
blk.84.attn_v.weightQ3_K[8192 1024]
-
blk.85.attn_k.biasF32[1024]
-
blk.85.attn_k.weightQ3_K[8192 1024]
-
blk.85.attn_q.biasF32[8192]
-
blk.85.attn_q.weightQ3_K[8192 8192]
-
blk.85.attn_v.biasF32[1024]
-
blk.85.attn_v.weightQ3_K[8192 1024]
-
blk.85.attn_norm.weightF32[8192]
-
blk.85.ffn_down.weight(!unknown_type 20!)[29568 8192]
-
blk.85.ffn_gate.weightQ3_K[8192 29568]
-
blk.85.ffn_up.weightQ3_K[8192 29568]
-
blk.85.ffn_norm.weightF32[8192]
-
blk.85.attn_output.weightQ3_K[8192 8192]
-
output_norm.weightF32[8192]
-
output.weightQ6_K[8192 151646]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63
blk.64
blk.65
blk.66
blk.67
blk.68
blk.69
blk.70
blk.71
blk.72
blk.73
blk.74
blk.75
blk.76
blk.77
blk.78
blk.79
blk.80
blk.81
blk.82
blk.83
blk.84
blk.85