An RP model with impressive flexibility.
27B
59 Pulls Updated 7 weeks ago
ce3ad0aa7352 · 22GB
-
general.architecturegemma2
-
general.file_typeQ6_K
-
gemma2.attention.head_count32
-
gemma2.attention.head_count_kv16
-
gemma2.attention.key_length128
-
gemma2.attention.layer_norm_rms_epsilon1e-06
-
gemma2.attention.sliding_window4096
-
gemma2.attention.value_length128
-
gemma2.attn_logit_softcapping50
-
gemma2.block_count46
-
gemma2.context_length8192
-
gemma2.embedding_length4608
-
gemma2.feed_forward_length36864
-
gemma2.final_logit_softcapping30
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id2
-
tokenizer.ggml.eos_token_id1
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<pad> <eos> <bos> <unk> <mask> ...]
-
tokenizer.ggml.unknown_token_id3
-
NameTypeShape
-
token_embd.weightQ6_K[4608 256000]
-
blk.0.attn_norm.weightF32[4608]
-
blk.0.ffn_down.weightQ6_K[36864 4608]
-
blk.0.ffn_gate.weightQ6_K[4608 36864]
-
blk.0.ffn_up.weightQ6_K[4608 36864]
-
blk.0.post_attention_norm.weightF32[4608]
-
blk.0.post_ffw_norm.weightF32[4608]
-
blk.0.ffn_norm.weightF32[4608]
-
blk.0.attn_k.weightQ6_K[4608 2048]
-
blk.0.attn_output.weightQ6_K[4096 4608]
-
blk.0.attn_q.weightQ6_K[4608 4096]
-
blk.0.attn_v.weightQ6_K[4608 2048]
-
blk.1.attn_norm.weightF32[4608]
-
blk.1.ffn_down.weightQ6_K[36864 4608]
-
blk.1.ffn_gate.weightQ6_K[4608 36864]
-
blk.1.ffn_up.weightQ6_K[4608 36864]
-
blk.1.post_attention_norm.weightF32[4608]
-
blk.1.post_ffw_norm.weightF32[4608]
-
blk.1.ffn_norm.weightF32[4608]
-
blk.1.attn_k.weightQ6_K[4608 2048]
-
blk.1.attn_output.weightQ6_K[4096 4608]
-
blk.1.attn_q.weightQ6_K[4608 4096]
-
blk.1.attn_v.weightQ6_K[4608 2048]
-
blk.2.attn_norm.weightF32[4608]
-
blk.2.ffn_down.weightQ6_K[36864 4608]
-
blk.2.ffn_gate.weightQ6_K[4608 36864]
-
blk.2.ffn_up.weightQ6_K[4608 36864]
-
blk.2.post_attention_norm.weightF32[4608]
-
blk.2.post_ffw_norm.weightF32[4608]
-
blk.2.ffn_norm.weightF32[4608]
-
blk.2.attn_k.weightQ6_K[4608 2048]
-
blk.2.attn_output.weightQ6_K[4096 4608]
-
blk.2.attn_q.weightQ6_K[4608 4096]
-
blk.2.attn_v.weightQ6_K[4608 2048]
-
blk.3.attn_norm.weightF32[4608]
-
blk.3.ffn_down.weightQ6_K[36864 4608]
-
blk.3.ffn_gate.weightQ6_K[4608 36864]
-
blk.3.ffn_up.weightQ6_K[4608 36864]
-
blk.3.post_attention_norm.weightF32[4608]
-
blk.3.post_ffw_norm.weightF32[4608]
-
blk.3.ffn_norm.weightF32[4608]
-
blk.3.attn_k.weightQ6_K[4608 2048]
-
blk.3.attn_output.weightQ6_K[4096 4608]
-
blk.3.attn_q.weightQ6_K[4608 4096]
-
blk.3.attn_v.weightQ6_K[4608 2048]
-
blk.4.attn_norm.weightF32[4608]
-
blk.4.ffn_down.weightQ6_K[36864 4608]
-
blk.4.ffn_gate.weightQ6_K[4608 36864]
-
blk.4.ffn_up.weightQ6_K[4608 36864]
-
blk.4.post_attention_norm.weightF32[4608]
-
blk.4.post_ffw_norm.weightF32[4608]
-
blk.4.ffn_norm.weightF32[4608]
-
blk.4.attn_k.weightQ6_K[4608 2048]
-
blk.4.attn_output.weightQ6_K[4096 4608]
-
blk.4.attn_q.weightQ6_K[4608 4096]
-
blk.4.attn_v.weightQ6_K[4608 2048]
-
blk.5.attn_norm.weightF32[4608]
-
blk.5.ffn_down.weightQ6_K[36864 4608]
-
blk.5.ffn_gate.weightQ6_K[4608 36864]
-
blk.5.ffn_up.weightQ6_K[4608 36864]
-
blk.5.post_attention_norm.weightF32[4608]
-
blk.5.post_ffw_norm.weightF32[4608]
-
blk.5.ffn_norm.weightF32[4608]
-
blk.5.attn_k.weightQ6_K[4608 2048]
-
blk.5.attn_output.weightQ6_K[4096 4608]
-
blk.5.attn_q.weightQ6_K[4608 4096]
-
blk.5.attn_v.weightQ6_K[4608 2048]
-
blk.6.attn_norm.weightF32[4608]
-
blk.6.ffn_down.weightQ6_K[36864 4608]
-
blk.6.ffn_gate.weightQ6_K[4608 36864]
-
blk.6.ffn_up.weightQ6_K[4608 36864]
-
blk.6.post_attention_norm.weightF32[4608]
-
blk.6.post_ffw_norm.weightF32[4608]
-
blk.6.ffn_norm.weightF32[4608]
-
blk.6.attn_k.weightQ6_K[4608 2048]
-
blk.6.attn_output.weightQ6_K[4096 4608]
-
blk.6.attn_q.weightQ6_K[4608 4096]
-
blk.6.attn_v.weightQ6_K[4608 2048]
-
blk.7.attn_norm.weightF32[4608]
-
blk.7.ffn_down.weightQ6_K[36864 4608]
-
blk.7.ffn_gate.weightQ6_K[4608 36864]
-
blk.7.ffn_up.weightQ6_K[4608 36864]
-
blk.7.post_attention_norm.weightF32[4608]
-
blk.7.post_ffw_norm.weightF32[4608]
-
blk.7.ffn_norm.weightF32[4608]
-
blk.7.attn_k.weightQ6_K[4608 2048]
-
blk.7.attn_output.weightQ6_K[4096 4608]
-
blk.7.attn_q.weightQ6_K[4608 4096]
-
blk.7.attn_v.weightQ6_K[4608 2048]
-
blk.8.attn_norm.weightF32[4608]
-
blk.8.ffn_down.weightQ6_K[36864 4608]
-
blk.8.ffn_gate.weightQ6_K[4608 36864]
-
blk.8.ffn_up.weightQ6_K[4608 36864]
-
blk.8.post_attention_norm.weightF32[4608]
-
blk.8.post_ffw_norm.weightF32[4608]
-
blk.8.ffn_norm.weightF32[4608]
-
blk.8.attn_k.weightQ6_K[4608 2048]
-
blk.8.attn_output.weightQ6_K[4096 4608]
-
blk.8.attn_q.weightQ6_K[4608 4096]
-
blk.8.attn_v.weightQ6_K[4608 2048]
-
blk.9.attn_norm.weightF32[4608]
-
blk.9.ffn_down.weightQ6_K[36864 4608]
-
blk.9.ffn_gate.weightQ6_K[4608 36864]
-
blk.9.ffn_up.weightQ6_K[4608 36864]
-
blk.9.post_attention_norm.weightF32[4608]
-
blk.9.post_ffw_norm.weightF32[4608]
-
blk.9.ffn_norm.weightF32[4608]
-
blk.9.attn_k.weightQ6_K[4608 2048]
-
blk.9.attn_output.weightQ6_K[4096 4608]
-
blk.9.attn_q.weightQ6_K[4608 4096]
-
blk.9.attn_v.weightQ6_K[4608 2048]
-
blk.10.attn_norm.weightF32[4608]
-
blk.10.ffn_down.weightQ6_K[36864 4608]
-
blk.10.ffn_gate.weightQ6_K[4608 36864]
-
blk.10.ffn_up.weightQ6_K[4608 36864]
-
blk.10.post_attention_norm.weightF32[4608]
-
blk.10.post_ffw_norm.weightF32[4608]
-
blk.10.ffn_norm.weightF32[4608]
-
blk.10.attn_k.weightQ6_K[4608 2048]
-
blk.10.attn_output.weightQ6_K[4096 4608]
-
blk.10.attn_q.weightQ6_K[4608 4096]
-
blk.10.attn_v.weightQ6_K[4608 2048]
-
blk.11.attn_norm.weightF32[4608]
-
blk.11.ffn_down.weightQ6_K[36864 4608]
-
blk.11.ffn_gate.weightQ6_K[4608 36864]
-
blk.11.ffn_up.weightQ6_K[4608 36864]
-
blk.11.post_attention_norm.weightF32[4608]
-
blk.11.post_ffw_norm.weightF32[4608]
-
blk.11.ffn_norm.weightF32[4608]
-
blk.11.attn_k.weightQ6_K[4608 2048]
-
blk.11.attn_output.weightQ6_K[4096 4608]
-
blk.11.attn_q.weightQ6_K[4608 4096]
-
blk.11.attn_v.weightQ6_K[4608 2048]
-
blk.12.attn_norm.weightF32[4608]
-
blk.12.ffn_down.weightQ6_K[36864 4608]
-
blk.12.ffn_gate.weightQ6_K[4608 36864]
-
blk.12.ffn_up.weightQ6_K[4608 36864]
-
blk.12.post_attention_norm.weightF32[4608]
-
blk.12.post_ffw_norm.weightF32[4608]
-
blk.12.ffn_norm.weightF32[4608]
-
blk.12.attn_k.weightQ6_K[4608 2048]
-
blk.12.attn_output.weightQ6_K[4096 4608]
-
blk.12.attn_q.weightQ6_K[4608 4096]
-
blk.12.attn_v.weightQ6_K[4608 2048]
-
blk.13.attn_norm.weightF32[4608]
-
blk.13.ffn_down.weightQ6_K[36864 4608]
-
blk.13.ffn_gate.weightQ6_K[4608 36864]
-
blk.13.ffn_up.weightQ6_K[4608 36864]
-
blk.13.post_attention_norm.weightF32[4608]
-
blk.13.post_ffw_norm.weightF32[4608]
-
blk.13.ffn_norm.weightF32[4608]
-
blk.13.attn_k.weightQ6_K[4608 2048]
-
blk.13.attn_output.weightQ6_K[4096 4608]
-
blk.13.attn_q.weightQ6_K[4608 4096]
-
blk.13.attn_v.weightQ6_K[4608 2048]
-
blk.14.attn_norm.weightF32[4608]
-
blk.14.ffn_down.weightQ6_K[36864 4608]
-
blk.14.ffn_gate.weightQ6_K[4608 36864]
-
blk.14.ffn_up.weightQ6_K[4608 36864]
-
blk.14.post_attention_norm.weightF32[4608]
-
blk.14.post_ffw_norm.weightF32[4608]
-
blk.14.ffn_norm.weightF32[4608]
-
blk.14.attn_k.weightQ6_K[4608 2048]
-
blk.14.attn_output.weightQ6_K[4096 4608]
-
blk.14.attn_q.weightQ6_K[4608 4096]
-
blk.14.attn_v.weightQ6_K[4608 2048]
-
blk.15.attn_norm.weightF32[4608]
-
blk.15.ffn_down.weightQ6_K[36864 4608]
-
blk.15.ffn_gate.weightQ6_K[4608 36864]
-
blk.15.ffn_up.weightQ6_K[4608 36864]
-
blk.15.post_attention_norm.weightF32[4608]
-
blk.15.post_ffw_norm.weightF32[4608]
-
blk.15.ffn_norm.weightF32[4608]
-
blk.15.attn_k.weightQ6_K[4608 2048]
-
blk.15.attn_output.weightQ6_K[4096 4608]
-
blk.15.attn_q.weightQ6_K[4608 4096]
-
blk.15.attn_v.weightQ6_K[4608 2048]
-
blk.16.attn_norm.weightF32[4608]
-
blk.16.ffn_down.weightQ6_K[36864 4608]
-
blk.16.ffn_gate.weightQ6_K[4608 36864]
-
blk.16.ffn_up.weightQ6_K[4608 36864]
-
blk.16.post_attention_norm.weightF32[4608]
-
blk.16.post_ffw_norm.weightF32[4608]
-
blk.16.ffn_norm.weightF32[4608]
-
blk.16.attn_k.weightQ6_K[4608 2048]
-
blk.16.attn_output.weightQ6_K[4096 4608]
-
blk.16.attn_q.weightQ6_K[4608 4096]
-
blk.16.attn_v.weightQ6_K[4608 2048]
-
blk.17.attn_norm.weightF32[4608]
-
blk.17.ffn_down.weightQ6_K[36864 4608]
-
blk.17.ffn_gate.weightQ6_K[4608 36864]
-
blk.17.ffn_up.weightQ6_K[4608 36864]
-
blk.17.post_attention_norm.weightF32[4608]
-
blk.17.post_ffw_norm.weightF32[4608]
-
blk.17.ffn_norm.weightF32[4608]
-
blk.17.attn_k.weightQ6_K[4608 2048]
-
blk.17.attn_output.weightQ6_K[4096 4608]
-
blk.17.attn_q.weightQ6_K[4608 4096]
-
blk.17.attn_v.weightQ6_K[4608 2048]
-
blk.18.attn_norm.weightF32[4608]
-
blk.18.ffn_down.weightQ6_K[36864 4608]
-
blk.18.ffn_gate.weightQ6_K[4608 36864]
-
blk.18.ffn_up.weightQ6_K[4608 36864]
-
blk.18.post_attention_norm.weightF32[4608]
-
blk.18.post_ffw_norm.weightF32[4608]
-
blk.18.ffn_norm.weightF32[4608]
-
blk.18.attn_k.weightQ6_K[4608 2048]
-
blk.18.attn_output.weightQ6_K[4096 4608]
-
blk.18.attn_q.weightQ6_K[4608 4096]
-
blk.18.attn_v.weightQ6_K[4608 2048]
-
blk.19.attn_norm.weightF32[4608]
-
blk.19.ffn_down.weightQ6_K[36864 4608]
-
blk.19.ffn_gate.weightQ6_K[4608 36864]
-
blk.19.ffn_up.weightQ6_K[4608 36864]
-
blk.19.post_attention_norm.weightF32[4608]
-
blk.19.post_ffw_norm.weightF32[4608]
-
blk.19.ffn_norm.weightF32[4608]
-
blk.19.attn_k.weightQ6_K[4608 2048]
-
blk.19.attn_output.weightQ6_K[4096 4608]
-
blk.19.attn_q.weightQ6_K[4608 4096]
-
blk.19.attn_v.weightQ6_K[4608 2048]
-
blk.20.attn_norm.weightF32[4608]
-
blk.20.ffn_down.weightQ6_K[36864 4608]
-
blk.20.ffn_gate.weightQ6_K[4608 36864]
-
blk.20.ffn_up.weightQ6_K[4608 36864]
-
blk.20.post_attention_norm.weightF32[4608]
-
blk.20.post_ffw_norm.weightF32[4608]
-
blk.20.ffn_norm.weightF32[4608]
-
blk.20.attn_k.weightQ6_K[4608 2048]
-
blk.20.attn_output.weightQ6_K[4096 4608]
-
blk.20.attn_q.weightQ6_K[4608 4096]
-
blk.20.attn_v.weightQ6_K[4608 2048]
-
blk.21.attn_norm.weightF32[4608]
-
blk.21.ffn_down.weightQ6_K[36864 4608]
-
blk.21.ffn_gate.weightQ6_K[4608 36864]
-
blk.21.ffn_up.weightQ6_K[4608 36864]
-
blk.21.post_attention_norm.weightF32[4608]
-
blk.21.post_ffw_norm.weightF32[4608]
-
blk.21.ffn_norm.weightF32[4608]
-
blk.21.attn_k.weightQ6_K[4608 2048]
-
blk.21.attn_output.weightQ6_K[4096 4608]
-
blk.21.attn_q.weightQ6_K[4608 4096]
-
blk.21.attn_v.weightQ6_K[4608 2048]
-
blk.22.attn_norm.weightF32[4608]
-
blk.22.ffn_down.weightQ6_K[36864 4608]
-
blk.22.ffn_gate.weightQ6_K[4608 36864]
-
blk.22.ffn_up.weightQ6_K[4608 36864]
-
blk.22.post_attention_norm.weightF32[4608]
-
blk.22.post_ffw_norm.weightF32[4608]
-
blk.22.ffn_norm.weightF32[4608]
-
blk.22.attn_k.weightQ6_K[4608 2048]
-
blk.22.attn_output.weightQ6_K[4096 4608]
-
blk.22.attn_q.weightQ6_K[4608 4096]
-
blk.22.attn_v.weightQ6_K[4608 2048]
-
blk.23.attn_norm.weightF32[4608]
-
blk.23.ffn_down.weightQ6_K[36864 4608]
-
blk.23.ffn_gate.weightQ6_K[4608 36864]
-
blk.23.ffn_up.weightQ6_K[4608 36864]
-
blk.23.post_attention_norm.weightF32[4608]
-
blk.23.post_ffw_norm.weightF32[4608]
-
blk.23.ffn_norm.weightF32[4608]
-
blk.23.attn_k.weightQ6_K[4608 2048]
-
blk.23.attn_output.weightQ6_K[4096 4608]
-
blk.23.attn_q.weightQ6_K[4608 4096]
-
blk.23.attn_v.weightQ6_K[4608 2048]
-
blk.24.attn_norm.weightF32[4608]
-
blk.24.ffn_down.weightQ6_K[36864 4608]
-
blk.24.ffn_gate.weightQ6_K[4608 36864]
-
blk.24.ffn_up.weightQ6_K[4608 36864]
-
blk.24.post_attention_norm.weightF32[4608]
-
blk.24.post_ffw_norm.weightF32[4608]
-
blk.24.ffn_norm.weightF32[4608]
-
blk.24.attn_k.weightQ6_K[4608 2048]
-
blk.24.attn_output.weightQ6_K[4096 4608]
-
blk.24.attn_q.weightQ6_K[4608 4096]
-
blk.24.attn_v.weightQ6_K[4608 2048]
-
blk.25.attn_norm.weightF32[4608]
-
blk.25.ffn_down.weightQ6_K[36864 4608]
-
blk.25.ffn_gate.weightQ6_K[4608 36864]
-
blk.25.ffn_up.weightQ6_K[4608 36864]
-
blk.25.post_attention_norm.weightF32[4608]
-
blk.25.post_ffw_norm.weightF32[4608]
-
blk.25.ffn_norm.weightF32[4608]
-
blk.25.attn_k.weightQ6_K[4608 2048]
-
blk.25.attn_output.weightQ6_K[4096 4608]
-
blk.25.attn_q.weightQ6_K[4608 4096]
-
blk.25.attn_v.weightQ6_K[4608 2048]
-
blk.26.attn_norm.weightF32[4608]
-
blk.26.ffn_down.weightQ6_K[36864 4608]
-
blk.26.ffn_gate.weightQ6_K[4608 36864]
-
blk.26.ffn_up.weightQ6_K[4608 36864]
-
blk.26.post_attention_norm.weightF32[4608]
-
blk.26.post_ffw_norm.weightF32[4608]
-
blk.26.ffn_norm.weightF32[4608]
-
blk.26.attn_k.weightQ6_K[4608 2048]
-
blk.26.attn_output.weightQ6_K[4096 4608]
-
blk.26.attn_q.weightQ6_K[4608 4096]
-
blk.26.attn_v.weightQ6_K[4608 2048]
-
blk.27.attn_norm.weightF32[4608]
-
blk.27.ffn_down.weightQ6_K[36864 4608]
-
blk.27.ffn_gate.weightQ6_K[4608 36864]
-
blk.27.ffn_up.weightQ6_K[4608 36864]
-
blk.27.post_attention_norm.weightF32[4608]
-
blk.27.post_ffw_norm.weightF32[4608]
-
blk.27.ffn_norm.weightF32[4608]
-
blk.27.attn_k.weightQ6_K[4608 2048]
-
blk.27.attn_output.weightQ6_K[4096 4608]
-
blk.27.attn_q.weightQ6_K[4608 4096]
-
blk.27.attn_v.weightQ6_K[4608 2048]
-
blk.28.attn_norm.weightF32[4608]
-
blk.28.ffn_down.weightQ6_K[36864 4608]
-
blk.28.ffn_gate.weightQ6_K[4608 36864]
-
blk.28.ffn_up.weightQ6_K[4608 36864]
-
blk.28.post_attention_norm.weightF32[4608]
-
blk.28.post_ffw_norm.weightF32[4608]
-
blk.28.ffn_norm.weightF32[4608]
-
blk.28.attn_k.weightQ6_K[4608 2048]
-
blk.28.attn_output.weightQ6_K[4096 4608]
-
blk.28.attn_q.weightQ6_K[4608 4096]
-
blk.28.attn_v.weightQ6_K[4608 2048]
-
blk.29.attn_norm.weightF32[4608]
-
blk.29.ffn_down.weightQ6_K[36864 4608]
-
blk.29.ffn_gate.weightQ6_K[4608 36864]
-
blk.29.ffn_up.weightQ6_K[4608 36864]
-
blk.29.post_attention_norm.weightF32[4608]
-
blk.29.post_ffw_norm.weightF32[4608]
-
blk.29.ffn_norm.weightF32[4608]
-
blk.29.attn_k.weightQ6_K[4608 2048]
-
blk.29.attn_output.weightQ6_K[4096 4608]
-
blk.29.attn_q.weightQ6_K[4608 4096]
-
blk.29.attn_v.weightQ6_K[4608 2048]
-
blk.30.attn_norm.weightF32[4608]
-
blk.30.ffn_down.weightQ6_K[36864 4608]
-
blk.30.ffn_gate.weightQ6_K[4608 36864]
-
blk.30.ffn_up.weightQ6_K[4608 36864]
-
blk.30.post_attention_norm.weightF32[4608]
-
blk.30.post_ffw_norm.weightF32[4608]
-
blk.30.ffn_norm.weightF32[4608]
-
blk.30.attn_k.weightQ6_K[4608 2048]
-
blk.30.attn_output.weightQ6_K[4096 4608]
-
blk.30.attn_q.weightQ6_K[4608 4096]
-
blk.30.attn_v.weightQ6_K[4608 2048]
-
blk.31.attn_norm.weightF32[4608]
-
blk.31.ffn_down.weightQ6_K[36864 4608]
-
blk.31.ffn_gate.weightQ6_K[4608 36864]
-
blk.31.ffn_up.weightQ6_K[4608 36864]
-
blk.31.post_attention_norm.weightF32[4608]
-
blk.31.post_ffw_norm.weightF32[4608]
-
blk.31.ffn_norm.weightF32[4608]
-
blk.31.attn_k.weightQ6_K[4608 2048]
-
blk.31.attn_output.weightQ6_K[4096 4608]
-
blk.31.attn_q.weightQ6_K[4608 4096]
-
blk.31.attn_v.weightQ6_K[4608 2048]
-
blk.32.attn_norm.weightF32[4608]
-
blk.32.ffn_down.weightQ6_K[36864 4608]
-
blk.32.ffn_gate.weightQ6_K[4608 36864]
-
blk.32.ffn_up.weightQ6_K[4608 36864]
-
blk.32.post_attention_norm.weightF32[4608]
-
blk.32.post_ffw_norm.weightF32[4608]
-
blk.32.ffn_norm.weightF32[4608]
-
blk.32.attn_k.weightQ6_K[4608 2048]
-
blk.32.attn_output.weightQ6_K[4096 4608]
-
blk.32.attn_q.weightQ6_K[4608 4096]
-
blk.32.attn_v.weightQ6_K[4608 2048]
-
blk.33.attn_norm.weightF32[4608]
-
blk.33.ffn_down.weightQ6_K[36864 4608]
-
blk.33.ffn_gate.weightQ6_K[4608 36864]
-
blk.33.ffn_up.weightQ6_K[4608 36864]
-
blk.33.post_attention_norm.weightF32[4608]
-
blk.33.post_ffw_norm.weightF32[4608]
-
blk.33.ffn_norm.weightF32[4608]
-
blk.33.attn_k.weightQ6_K[4608 2048]
-
blk.33.attn_output.weightQ6_K[4096 4608]
-
blk.33.attn_q.weightQ6_K[4608 4096]
-
blk.33.attn_v.weightQ6_K[4608 2048]
-
blk.34.attn_norm.weightF32[4608]
-
blk.34.ffn_down.weightQ6_K[36864 4608]
-
blk.34.ffn_gate.weightQ6_K[4608 36864]
-
blk.34.ffn_up.weightQ6_K[4608 36864]
-
blk.34.post_attention_norm.weightF32[4608]
-
blk.34.post_ffw_norm.weightF32[4608]
-
blk.34.ffn_norm.weightF32[4608]
-
blk.34.attn_k.weightQ6_K[4608 2048]
-
blk.34.attn_output.weightQ6_K[4096 4608]
-
blk.34.attn_q.weightQ6_K[4608 4096]
-
blk.34.attn_v.weightQ6_K[4608 2048]
-
blk.35.attn_norm.weightF32[4608]
-
blk.35.ffn_down.weightQ6_K[36864 4608]
-
blk.35.ffn_gate.weightQ6_K[4608 36864]
-
blk.35.ffn_up.weightQ6_K[4608 36864]
-
blk.35.post_attention_norm.weightF32[4608]
-
blk.35.post_ffw_norm.weightF32[4608]
-
blk.35.ffn_norm.weightF32[4608]
-
blk.35.attn_k.weightQ6_K[4608 2048]
-
blk.35.attn_output.weightQ6_K[4096 4608]
-
blk.35.attn_q.weightQ6_K[4608 4096]
-
blk.35.attn_v.weightQ6_K[4608 2048]
-
blk.36.attn_norm.weightF32[4608]
-
blk.36.ffn_down.weightQ6_K[36864 4608]
-
blk.36.ffn_gate.weightQ6_K[4608 36864]
-
blk.36.ffn_up.weightQ6_K[4608 36864]
-
blk.36.post_attention_norm.weightF32[4608]
-
blk.36.post_ffw_norm.weightF32[4608]
-
blk.36.ffn_norm.weightF32[4608]
-
blk.36.attn_k.weightQ6_K[4608 2048]
-
blk.36.attn_output.weightQ6_K[4096 4608]
-
blk.36.attn_q.weightQ6_K[4608 4096]
-
blk.36.attn_v.weightQ6_K[4608 2048]
-
blk.37.attn_norm.weightF32[4608]
-
blk.37.ffn_down.weightQ6_K[36864 4608]
-
blk.37.ffn_gate.weightQ6_K[4608 36864]
-
blk.37.ffn_up.weightQ6_K[4608 36864]
-
blk.37.post_attention_norm.weightF32[4608]
-
blk.37.post_ffw_norm.weightF32[4608]
-
blk.37.ffn_norm.weightF32[4608]
-
blk.37.attn_k.weightQ6_K[4608 2048]
-
blk.37.attn_output.weightQ6_K[4096 4608]
-
blk.37.attn_q.weightQ6_K[4608 4096]
-
blk.37.attn_v.weightQ6_K[4608 2048]
-
blk.38.attn_norm.weightF32[4608]
-
blk.38.ffn_down.weightQ6_K[36864 4608]
-
blk.38.ffn_gate.weightQ6_K[4608 36864]
-
blk.38.ffn_up.weightQ6_K[4608 36864]
-
blk.38.post_attention_norm.weightF32[4608]
-
blk.38.post_ffw_norm.weightF32[4608]
-
blk.38.ffn_norm.weightF32[4608]
-
blk.38.attn_k.weightQ6_K[4608 2048]
-
blk.38.attn_output.weightQ6_K[4096 4608]
-
blk.38.attn_q.weightQ6_K[4608 4096]
-
blk.38.attn_v.weightQ6_K[4608 2048]
-
blk.39.attn_norm.weightF32[4608]
-
blk.39.ffn_down.weightQ6_K[36864 4608]
-
blk.39.ffn_gate.weightQ6_K[4608 36864]
-
blk.39.ffn_up.weightQ6_K[4608 36864]
-
blk.39.post_attention_norm.weightF32[4608]
-
blk.39.post_ffw_norm.weightF32[4608]
-
blk.39.ffn_norm.weightF32[4608]
-
blk.39.attn_k.weightQ6_K[4608 2048]
-
blk.39.attn_output.weightQ6_K[4096 4608]
-
blk.39.attn_q.weightQ6_K[4608 4096]
-
blk.39.attn_v.weightQ6_K[4608 2048]
-
blk.40.attn_norm.weightF32[4608]
-
blk.40.ffn_down.weightQ6_K[36864 4608]
-
blk.40.ffn_gate.weightQ6_K[4608 36864]
-
blk.40.ffn_up.weightQ6_K[4608 36864]
-
blk.40.post_attention_norm.weightF32[4608]
-
blk.40.post_ffw_norm.weightF32[4608]
-
blk.40.ffn_norm.weightF32[4608]
-
blk.40.attn_k.weightQ6_K[4608 2048]
-
blk.40.attn_output.weightQ6_K[4096 4608]
-
blk.40.attn_q.weightQ6_K[4608 4096]
-
blk.40.attn_v.weightQ6_K[4608 2048]
-
blk.41.attn_norm.weightF32[4608]
-
blk.41.ffn_down.weightQ6_K[36864 4608]
-
blk.41.ffn_gate.weightQ6_K[4608 36864]
-
blk.41.ffn_up.weightQ6_K[4608 36864]
-
blk.41.post_attention_norm.weightF32[4608]
-
blk.41.post_ffw_norm.weightF32[4608]
-
blk.41.ffn_norm.weightF32[4608]
-
blk.41.attn_k.weightQ6_K[4608 2048]
-
blk.41.attn_output.weightQ6_K[4096 4608]
-
blk.41.attn_q.weightQ6_K[4608 4096]
-
blk.41.attn_v.weightQ6_K[4608 2048]
-
blk.42.attn_norm.weightF32[4608]
-
blk.42.ffn_down.weightQ6_K[36864 4608]
-
blk.42.ffn_gate.weightQ6_K[4608 36864]
-
blk.42.ffn_up.weightQ6_K[4608 36864]
-
blk.42.post_attention_norm.weightF32[4608]
-
blk.42.post_ffw_norm.weightF32[4608]
-
blk.42.ffn_norm.weightF32[4608]
-
blk.42.attn_k.weightQ6_K[4608 2048]
-
blk.42.attn_output.weightQ6_K[4096 4608]
-
blk.42.attn_q.weightQ6_K[4608 4096]
-
blk.42.attn_v.weightQ6_K[4608 2048]
-
blk.43.attn_norm.weightF32[4608]
-
blk.43.ffn_down.weightQ6_K[36864 4608]
-
blk.43.ffn_gate.weightQ6_K[4608 36864]
-
blk.43.ffn_up.weightQ6_K[4608 36864]
-
blk.43.post_attention_norm.weightF32[4608]
-
blk.43.post_ffw_norm.weightF32[4608]
-
blk.43.ffn_norm.weightF32[4608]
-
blk.43.attn_k.weightQ6_K[4608 2048]
-
blk.43.attn_output.weightQ6_K[4096 4608]
-
blk.43.attn_q.weightQ6_K[4608 4096]
-
blk.43.attn_v.weightQ6_K[4608 2048]
-
blk.44.attn_norm.weightF32[4608]
-
blk.44.ffn_down.weightQ6_K[36864 4608]
-
blk.44.ffn_gate.weightQ6_K[4608 36864]
-
blk.44.ffn_up.weightQ6_K[4608 36864]
-
blk.44.post_attention_norm.weightF32[4608]
-
blk.44.post_ffw_norm.weightF32[4608]
-
blk.44.ffn_norm.weightF32[4608]
-
blk.44.attn_k.weightQ6_K[4608 2048]
-
blk.44.attn_output.weightQ6_K[4096 4608]
-
blk.44.attn_q.weightQ6_K[4608 4096]
-
blk.44.attn_v.weightQ6_K[4608 2048]
-
blk.45.attn_norm.weightF32[4608]
-
blk.45.ffn_down.weightQ6_K[36864 4608]
-
blk.45.ffn_gate.weightQ6_K[4608 36864]
-
blk.45.ffn_up.weightQ6_K[4608 36864]
-
blk.45.post_attention_norm.weightF32[4608]
-
blk.45.post_ffw_norm.weightF32[4608]
-
blk.45.ffn_norm.weightF32[4608]
-
blk.45.attn_k.weightQ6_K[4608 2048]
-
blk.45.attn_output.weightQ6_K[4096 4608]
-
blk.45.attn_q.weightQ6_K[4608 4096]
-
blk.45.attn_v.weightQ6_K[4608 2048]
-
output_norm.weightF32[4608]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45