UNA SimpleSmaug 34b v1beta Q4_K_M GGUF
34B
58 Pulls Updated 5 months ago
d8a862bc3614 · 21GB
-
general.architecturellama
-
general.file_typeQ4_K_M
-
llama.attention.head_count56
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count60
-
llama.context_length32768
-
llama.embedding_length7168
-
llama.feed_forward_length20480
-
llama.rope.dimension_count128
-
llama.rope.freq_base5e+06
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <|startoftext|> <|endoftext|> <|Human|> <|Assistant|> ...]
-
NameTypeShape
-
token_embd.weightQ4_K[7168 64000]
-
blk.0.attn_norm.weightF32[7168]
-
blk.0.ffn_down.weightQ6_K[20480 7168]
-
blk.0.ffn_gate.weightQ4_K[7168 20480]
-
blk.0.ffn_up.weightQ4_K[7168 20480]
-
blk.0.ffn_norm.weightF32[7168]
-
blk.0.attn_k.weightQ4_K[7168 1024]
-
blk.0.attn_output.weightQ4_K[7168 7168]
-
blk.0.attn_q.weightQ4_K[7168 7168]
-
blk.0.attn_v.weightQ6_K[7168 1024]
-
blk.1.attn_norm.weightF32[7168]
-
blk.1.ffn_down.weightQ6_K[20480 7168]
-
blk.1.ffn_gate.weightQ4_K[7168 20480]
-
blk.1.ffn_up.weightQ4_K[7168 20480]
-
blk.1.ffn_norm.weightF32[7168]
-
blk.1.attn_k.weightQ4_K[7168 1024]
-
blk.1.attn_output.weightQ4_K[7168 7168]
-
blk.1.attn_q.weightQ4_K[7168 7168]
-
blk.1.attn_v.weightQ6_K[7168 1024]
-
blk.2.attn_norm.weightF32[7168]
-
blk.2.ffn_down.weightQ6_K[20480 7168]
-
blk.2.ffn_gate.weightQ4_K[7168 20480]
-
blk.2.ffn_up.weightQ4_K[7168 20480]
-
blk.2.ffn_norm.weightF32[7168]
-
blk.2.attn_k.weightQ4_K[7168 1024]
-
blk.2.attn_output.weightQ4_K[7168 7168]
-
blk.2.attn_q.weightQ4_K[7168 7168]
-
blk.2.attn_v.weightQ6_K[7168 1024]
-
blk.3.ffn_gate.weightQ4_K[7168 20480]
-
blk.3.attn_k.weightQ4_K[7168 1024]
-
blk.3.attn_output.weightQ4_K[7168 7168]
-
blk.3.attn_q.weightQ4_K[7168 7168]
-
blk.3.attn_v.weightQ6_K[7168 1024]
-
blk.3.attn_norm.weightF32[7168]
-
blk.3.ffn_down.weightQ6_K[20480 7168]
-
blk.3.ffn_up.weightQ4_K[7168 20480]
-
blk.3.ffn_norm.weightF32[7168]
-
blk.4.attn_norm.weightF32[7168]
-
blk.4.ffn_down.weightQ6_K[20480 7168]
-
blk.4.ffn_gate.weightQ4_K[7168 20480]
-
blk.4.ffn_up.weightQ4_K[7168 20480]
-
blk.4.ffn_norm.weightF32[7168]
-
blk.4.attn_k.weightQ4_K[7168 1024]
-
blk.4.attn_output.weightQ4_K[7168 7168]
-
blk.4.attn_q.weightQ4_K[7168 7168]
-
blk.4.attn_v.weightQ6_K[7168 1024]
-
blk.5.attn_norm.weightF32[7168]
-
blk.5.ffn_down.weightQ6_K[20480 7168]
-
blk.5.ffn_gate.weightQ4_K[7168 20480]
-
blk.5.ffn_up.weightQ4_K[7168 20480]
-
blk.5.ffn_norm.weightF32[7168]
-
blk.5.attn_k.weightQ4_K[7168 1024]
-
blk.5.attn_output.weightQ4_K[7168 7168]
-
blk.5.attn_q.weightQ4_K[7168 7168]
-
blk.5.attn_v.weightQ6_K[7168 1024]
-
blk.6.attn_norm.weightF32[7168]
-
blk.6.ffn_down.weightQ6_K[20480 7168]
-
blk.6.ffn_gate.weightQ4_K[7168 20480]
-
blk.6.ffn_up.weightQ4_K[7168 20480]
-
blk.6.ffn_norm.weightF32[7168]
-
blk.6.attn_k.weightQ4_K[7168 1024]
-
blk.6.attn_output.weightQ4_K[7168 7168]
-
blk.6.attn_q.weightQ4_K[7168 7168]
-
blk.6.attn_v.weightQ6_K[7168 1024]
-
blk.7.ffn_gate.weightQ4_K[7168 20480]
-
blk.7.ffn_up.weightQ4_K[7168 20480]
-
blk.7.attn_k.weightQ4_K[7168 1024]
-
blk.7.attn_output.weightQ4_K[7168 7168]
-
blk.7.attn_q.weightQ4_K[7168 7168]
-
blk.7.attn_v.weightQ4_K[7168 1024]
-
blk.7.attn_norm.weightF32[7168]
-
blk.7.ffn_down.weightQ6_K[20480 7168]
-
blk.7.ffn_norm.weightF32[7168]
-
blk.8.attn_norm.weightF32[7168]
-
blk.8.ffn_down.weightQ4_K[20480 7168]
-
blk.8.ffn_gate.weightQ4_K[7168 20480]
-
blk.8.ffn_up.weightQ4_K[7168 20480]
-
blk.8.ffn_norm.weightF32[7168]
-
blk.8.attn_k.weightQ4_K[7168 1024]
-
blk.8.attn_output.weightQ4_K[7168 7168]
-
blk.8.attn_q.weightQ4_K[7168 7168]
-
blk.8.attn_v.weightQ4_K[7168 1024]
-
blk.9.attn_norm.weightF32[7168]
-
blk.9.ffn_down.weightQ4_K[20480 7168]
-
blk.9.ffn_gate.weightQ4_K[7168 20480]
-
blk.9.ffn_up.weightQ4_K[7168 20480]
-
blk.9.ffn_norm.weightF32[7168]
-
blk.9.attn_k.weightQ4_K[7168 1024]
-
blk.9.attn_output.weightQ4_K[7168 7168]
-
blk.9.attn_q.weightQ4_K[7168 7168]
-
blk.9.attn_v.weightQ6_K[7168 1024]
-
blk.10.attn_norm.weightF32[7168]
-
blk.10.ffn_down.weightQ4_K[20480 7168]
-
blk.10.ffn_gate.weightQ4_K[7168 20480]
-
blk.10.ffn_up.weightQ4_K[7168 20480]
-
blk.10.ffn_norm.weightF32[7168]
-
blk.10.attn_k.weightQ4_K[7168 1024]
-
blk.10.attn_output.weightQ4_K[7168 7168]
-
blk.10.attn_q.weightQ4_K[7168 7168]
-
blk.10.attn_v.weightQ4_K[7168 1024]
-
blk.11.attn_norm.weightF32[7168]
-
blk.11.ffn_down.weightQ4_K[20480 7168]
-
blk.11.ffn_gate.weightQ4_K[7168 20480]
-
blk.11.ffn_up.weightQ4_K[7168 20480]
-
blk.11.ffn_norm.weightF32[7168]
-
blk.11.attn_k.weightQ4_K[7168 1024]
-
blk.11.attn_output.weightQ4_K[7168 7168]
-
blk.11.attn_q.weightQ4_K[7168 7168]
-
blk.11.attn_v.weightQ6_K[7168 1024]
-
blk.12.attn_k.weightQ4_K[7168 1024]
-
blk.12.attn_output.weightQ4_K[7168 7168]
-
blk.12.attn_q.weightQ4_K[7168 7168]
-
blk.12.attn_v.weightQ4_K[7168 1024]
-
blk.12.attn_norm.weightF32[7168]
-
blk.12.ffn_down.weightQ6_K[20480 7168]
-
blk.12.ffn_gate.weightQ4_K[7168 20480]
-
blk.12.ffn_up.weightQ4_K[7168 20480]
-
blk.12.ffn_norm.weightF32[7168]
-
blk.13.attn_norm.weightF32[7168]
-
blk.13.ffn_down.weightQ4_K[20480 7168]
-
blk.13.ffn_gate.weightQ4_K[7168 20480]
-
blk.13.ffn_up.weightQ4_K[7168 20480]
-
blk.13.ffn_norm.weightF32[7168]
-
blk.13.attn_k.weightQ4_K[7168 1024]
-
blk.13.attn_output.weightQ4_K[7168 7168]
-
blk.13.attn_q.weightQ4_K[7168 7168]
-
blk.13.attn_v.weightQ4_K[7168 1024]
-
blk.14.attn_norm.weightF32[7168]
-
blk.14.ffn_down.weightQ4_K[20480 7168]
-
blk.14.ffn_gate.weightQ4_K[7168 20480]
-
blk.14.ffn_up.weightQ4_K[7168 20480]
-
blk.14.ffn_norm.weightF32[7168]
-
blk.14.attn_k.weightQ4_K[7168 1024]
-
blk.14.attn_output.weightQ4_K[7168 7168]
-
blk.14.attn_q.weightQ4_K[7168 7168]
-
blk.14.attn_v.weightQ4_K[7168 1024]
-
blk.15.attn_norm.weightF32[7168]
-
blk.15.ffn_down.weightQ6_K[20480 7168]
-
blk.15.ffn_gate.weightQ4_K[7168 20480]
-
blk.15.ffn_up.weightQ4_K[7168 20480]
-
blk.15.ffn_norm.weightF32[7168]
-
blk.15.attn_k.weightQ4_K[7168 1024]
-
blk.15.attn_output.weightQ4_K[7168 7168]
-
blk.15.attn_q.weightQ4_K[7168 7168]
-
blk.15.attn_v.weightQ6_K[7168 1024]
-
blk.16.ffn_gate.weightQ4_K[7168 20480]
-
blk.16.attn_k.weightQ4_K[7168 1024]
-
blk.16.attn_output.weightQ4_K[7168 7168]
-
blk.16.attn_q.weightQ4_K[7168 7168]
-
blk.16.attn_v.weightQ4_K[7168 1024]
-
blk.16.attn_norm.weightF32[7168]
-
blk.16.ffn_down.weightQ4_K[20480 7168]
-
blk.16.ffn_up.weightQ4_K[7168 20480]
-
blk.16.ffn_norm.weightF32[7168]
-
blk.17.attn_norm.weightF32[7168]
-
blk.17.ffn_down.weightQ4_K[20480 7168]
-
blk.17.ffn_gate.weightQ4_K[7168 20480]
-
blk.17.ffn_up.weightQ4_K[7168 20480]
-
blk.17.ffn_norm.weightF32[7168]
-
blk.17.attn_k.weightQ4_K[7168 1024]
-
blk.17.attn_output.weightQ4_K[7168 7168]
-
blk.17.attn_q.weightQ4_K[7168 7168]
-
blk.17.attn_v.weightQ4_K[7168 1024]
-
blk.18.attn_norm.weightF32[7168]
-
blk.18.ffn_down.weightQ6_K[20480 7168]
-
blk.18.ffn_gate.weightQ4_K[7168 20480]
-
blk.18.ffn_up.weightQ4_K[7168 20480]
-
blk.18.ffn_norm.weightF32[7168]
-
blk.18.attn_k.weightQ4_K[7168 1024]
-
blk.18.attn_output.weightQ4_K[7168 7168]
-
blk.18.attn_q.weightQ4_K[7168 7168]
-
blk.18.attn_v.weightQ6_K[7168 1024]
-
blk.19.attn_norm.weightF32[7168]
-
blk.19.ffn_down.weightQ4_K[20480 7168]
-
blk.19.ffn_gate.weightQ4_K[7168 20480]
-
blk.19.ffn_up.weightQ4_K[7168 20480]
-
blk.19.ffn_norm.weightF32[7168]
-
blk.19.attn_k.weightQ4_K[7168 1024]
-
blk.19.attn_output.weightQ4_K[7168 7168]
-
blk.19.attn_q.weightQ4_K[7168 7168]
-
blk.19.attn_v.weightQ4_K[7168 1024]
-
blk.20.ffn_gate.weightQ4_K[7168 20480]
-
blk.20.ffn_up.weightQ4_K[7168 20480]
-
blk.20.attn_k.weightQ4_K[7168 1024]
-
blk.20.attn_output.weightQ4_K[7168 7168]
-
blk.20.attn_q.weightQ4_K[7168 7168]
-
blk.20.attn_v.weightQ4_K[7168 1024]
-
blk.20.attn_norm.weightF32[7168]
-
blk.20.ffn_down.weightQ4_K[20480 7168]
-
blk.20.ffn_norm.weightF32[7168]
-
blk.21.attn_norm.weightF32[7168]
-
blk.21.ffn_down.weightQ6_K[20480 7168]
-
blk.21.ffn_gate.weightQ4_K[7168 20480]
-
blk.21.ffn_up.weightQ4_K[7168 20480]
-
blk.21.ffn_norm.weightF32[7168]
-
blk.21.attn_k.weightQ4_K[7168 1024]
-
blk.21.attn_output.weightQ4_K[7168 7168]
-
blk.21.attn_q.weightQ4_K[7168 7168]
-
blk.21.attn_v.weightQ6_K[7168 1024]
-
blk.22.attn_norm.weightF32[7168]
-
blk.22.ffn_down.weightQ4_K[20480 7168]
-
blk.22.ffn_gate.weightQ4_K[7168 20480]
-
blk.22.ffn_up.weightQ4_K[7168 20480]
-
blk.22.ffn_norm.weightF32[7168]
-
blk.22.attn_k.weightQ4_K[7168 1024]
-
blk.22.attn_output.weightQ4_K[7168 7168]
-
blk.22.attn_q.weightQ4_K[7168 7168]
-
blk.22.attn_v.weightQ4_K[7168 1024]
-
blk.23.attn_norm.weightF32[7168]
-
blk.23.ffn_down.weightQ4_K[20480 7168]
-
blk.23.ffn_gate.weightQ4_K[7168 20480]
-
blk.23.ffn_up.weightQ4_K[7168 20480]
-
blk.23.ffn_norm.weightF32[7168]
-
blk.23.attn_k.weightQ4_K[7168 1024]
-
blk.23.attn_output.weightQ4_K[7168 7168]
-
blk.23.attn_q.weightQ4_K[7168 7168]
-
blk.23.attn_v.weightQ4_K[7168 1024]
-
blk.24.attn_norm.weightF32[7168]
-
blk.24.ffn_down.weightQ6_K[20480 7168]
-
blk.24.ffn_gate.weightQ4_K[7168 20480]
-
blk.24.ffn_up.weightQ4_K[7168 20480]
-
blk.24.ffn_norm.weightF32[7168]
-
blk.24.attn_k.weightQ4_K[7168 1024]
-
blk.24.attn_output.weightQ4_K[7168 7168]
-
blk.24.attn_q.weightQ4_K[7168 7168]
-
blk.24.attn_v.weightQ6_K[7168 1024]
-
blk.25.attn_k.weightQ4_K[7168 1024]
-
blk.25.attn_output.weightQ4_K[7168 7168]
-
blk.25.attn_q.weightQ4_K[7168 7168]
-
blk.25.attn_v.weightQ4_K[7168 1024]
-
blk.25.attn_norm.weightF32[7168]
-
blk.25.ffn_down.weightQ4_K[20480 7168]
-
blk.25.ffn_gate.weightQ4_K[7168 20480]
-
blk.25.ffn_up.weightQ4_K[7168 20480]
-
blk.25.ffn_norm.weightF32[7168]
-
blk.26.attn_norm.weightF32[7168]
-
blk.26.ffn_down.weightQ4_K[20480 7168]
-
blk.26.ffn_gate.weightQ4_K[7168 20480]
-
blk.26.ffn_up.weightQ4_K[7168 20480]
-
blk.26.ffn_norm.weightF32[7168]
-
blk.26.attn_k.weightQ4_K[7168 1024]
-
blk.26.attn_output.weightQ4_K[7168 7168]
-
blk.26.attn_q.weightQ4_K[7168 7168]
-
blk.26.attn_v.weightQ4_K[7168 1024]
-
blk.27.attn_norm.weightF32[7168]
-
blk.27.ffn_down.weightQ6_K[20480 7168]
-
blk.27.ffn_gate.weightQ4_K[7168 20480]
-
blk.27.ffn_up.weightQ4_K[7168 20480]
-
blk.27.ffn_norm.weightF32[7168]
-
blk.27.attn_k.weightQ4_K[7168 1024]
-
blk.27.attn_output.weightQ4_K[7168 7168]
-
blk.27.attn_q.weightQ4_K[7168 7168]
-
blk.27.attn_v.weightQ6_K[7168 1024]
-
blk.28.attn_norm.weightF32[7168]
-
blk.28.ffn_down.weightQ4_K[20480 7168]
-
blk.28.ffn_gate.weightQ4_K[7168 20480]
-
blk.28.ffn_up.weightQ4_K[7168 20480]
-
blk.28.ffn_norm.weightF32[7168]
-
blk.28.attn_k.weightQ4_K[7168 1024]
-
blk.28.attn_output.weightQ4_K[7168 7168]
-
blk.28.attn_q.weightQ4_K[7168 7168]
-
blk.28.attn_v.weightQ4_K[7168 1024]
-
blk.29.ffn_gate.weightQ4_K[7168 20480]
-
blk.29.attn_k.weightQ4_K[7168 1024]
-
blk.29.attn_output.weightQ4_K[7168 7168]
-
blk.29.attn_q.weightQ4_K[7168 7168]
-
blk.29.attn_v.weightQ4_K[7168 1024]
-
blk.29.attn_norm.weightF32[7168]
-
blk.29.ffn_down.weightQ4_K[20480 7168]
-
blk.29.ffn_up.weightQ4_K[7168 20480]
-
blk.29.ffn_norm.weightF32[7168]
-
blk.30.attn_norm.weightF32[7168]
-
blk.30.ffn_down.weightQ6_K[20480 7168]
-
blk.30.ffn_gate.weightQ4_K[7168 20480]
-
blk.30.ffn_up.weightQ4_K[7168 20480]
-
blk.30.ffn_norm.weightF32[7168]
-
blk.30.attn_k.weightQ4_K[7168 1024]
-
blk.30.attn_output.weightQ4_K[7168 7168]
-
blk.30.attn_q.weightQ4_K[7168 7168]
-
blk.30.attn_v.weightQ6_K[7168 1024]
-
blk.31.attn_norm.weightF32[7168]
-
blk.31.ffn_down.weightQ4_K[20480 7168]
-
blk.31.ffn_gate.weightQ4_K[7168 20480]
-
blk.31.ffn_up.weightQ4_K[7168 20480]
-
blk.31.ffn_norm.weightF32[7168]
-
blk.31.attn_k.weightQ4_K[7168 1024]
-
blk.31.attn_output.weightQ4_K[7168 7168]
-
blk.31.attn_q.weightQ4_K[7168 7168]
-
blk.31.attn_v.weightQ4_K[7168 1024]
-
blk.32.attn_norm.weightF32[7168]
-
blk.32.ffn_down.weightQ4_K[20480 7168]
-
blk.32.ffn_gate.weightQ4_K[7168 20480]
-
blk.32.ffn_up.weightQ4_K[7168 20480]
-
blk.32.ffn_norm.weightF32[7168]
-
blk.32.attn_k.weightQ4_K[7168 1024]
-
blk.32.attn_output.weightQ4_K[7168 7168]
-
blk.32.attn_q.weightQ4_K[7168 7168]
-
blk.32.attn_v.weightQ4_K[7168 1024]
-
blk.33.ffn_gate.weightQ4_K[7168 20480]
-
blk.33.ffn_up.weightQ4_K[7168 20480]
-
blk.33.attn_k.weightQ4_K[7168 1024]
-
blk.33.attn_output.weightQ4_K[7168 7168]
-
blk.33.attn_q.weightQ4_K[7168 7168]
-
blk.33.attn_v.weightQ6_K[7168 1024]
-
blk.33.attn_norm.weightF32[7168]
-
blk.33.ffn_down.weightQ6_K[20480 7168]
-
blk.33.ffn_norm.weightF32[7168]
-
blk.34.attn_norm.weightF32[7168]
-
blk.34.ffn_down.weightQ4_K[20480 7168]
-
blk.34.ffn_gate.weightQ4_K[7168 20480]
-
blk.34.ffn_up.weightQ4_K[7168 20480]
-
blk.34.ffn_norm.weightF32[7168]
-
blk.34.attn_k.weightQ4_K[7168 1024]
-
blk.34.attn_output.weightQ4_K[7168 7168]
-
blk.34.attn_q.weightQ4_K[7168 7168]
-
blk.34.attn_v.weightQ4_K[7168 1024]
-
blk.35.attn_norm.weightF32[7168]
-
blk.35.ffn_down.weightQ4_K[20480 7168]
-
blk.35.ffn_gate.weightQ4_K[7168 20480]
-
blk.35.ffn_up.weightQ4_K[7168 20480]
-
blk.35.ffn_norm.weightF32[7168]
-
blk.35.attn_k.weightQ4_K[7168 1024]
-
blk.35.attn_output.weightQ4_K[7168 7168]
-
blk.35.attn_q.weightQ4_K[7168 7168]
-
blk.35.attn_v.weightQ4_K[7168 1024]
-
blk.36.attn_norm.weightF32[7168]
-
blk.36.ffn_down.weightQ6_K[20480 7168]
-
blk.36.ffn_gate.weightQ4_K[7168 20480]
-
blk.36.ffn_up.weightQ4_K[7168 20480]
-
blk.36.ffn_norm.weightF32[7168]
-
blk.36.attn_k.weightQ4_K[7168 1024]
-
blk.36.attn_output.weightQ4_K[7168 7168]
-
blk.36.attn_q.weightQ4_K[7168 7168]
-
blk.36.attn_v.weightQ6_K[7168 1024]
-
blk.37.attn_norm.weightF32[7168]
-
blk.37.ffn_down.weightQ4_K[20480 7168]
-
blk.37.ffn_gate.weightQ4_K[7168 20480]
-
blk.37.ffn_up.weightQ4_K[7168 20480]
-
blk.37.ffn_norm.weightF32[7168]
-
blk.37.attn_k.weightQ4_K[7168 1024]
-
blk.37.attn_output.weightQ4_K[7168 7168]
-
blk.37.attn_q.weightQ4_K[7168 7168]
-
blk.37.attn_v.weightQ4_K[7168 1024]
-
blk.38.attn_k.weightQ4_K[7168 1024]
-
blk.38.attn_output.weightQ4_K[7168 7168]
-
blk.38.attn_q.weightQ4_K[7168 7168]
-
blk.38.attn_v.weightQ4_K[7168 1024]
-
blk.38.attn_norm.weightF32[7168]
-
blk.38.ffn_down.weightQ4_K[20480 7168]
-
blk.38.ffn_gate.weightQ4_K[7168 20480]
-
blk.38.ffn_up.weightQ4_K[7168 20480]
-
blk.38.ffn_norm.weightF32[7168]
-
blk.39.attn_norm.weightF32[7168]
-
blk.39.ffn_down.weightQ6_K[20480 7168]
-
blk.39.ffn_gate.weightQ4_K[7168 20480]
-
blk.39.ffn_up.weightQ4_K[7168 20480]
-
blk.39.ffn_norm.weightF32[7168]
-
blk.39.attn_k.weightQ4_K[7168 1024]
-
blk.39.attn_output.weightQ4_K[7168 7168]
-
blk.39.attn_q.weightQ4_K[7168 7168]
-
blk.39.attn_v.weightQ6_K[7168 1024]
-
blk.40.attn_norm.weightF32[7168]
-
blk.40.ffn_down.weightQ4_K[20480 7168]
-
blk.40.ffn_gate.weightQ4_K[7168 20480]
-
blk.40.ffn_up.weightQ4_K[7168 20480]
-
blk.40.ffn_norm.weightF32[7168]
-
blk.40.attn_k.weightQ4_K[7168 1024]
-
blk.40.attn_output.weightQ4_K[7168 7168]
-
blk.40.attn_q.weightQ4_K[7168 7168]
-
blk.40.attn_v.weightQ4_K[7168 1024]
-
blk.41.attn_norm.weightF32[7168]
-
blk.41.ffn_down.weightQ4_K[20480 7168]
-
blk.41.ffn_gate.weightQ4_K[7168 20480]
-
blk.41.ffn_up.weightQ4_K[7168 20480]
-
blk.41.ffn_norm.weightF32[7168]
-
blk.41.attn_k.weightQ4_K[7168 1024]
-
blk.41.attn_output.weightQ4_K[7168 7168]
-
blk.41.attn_q.weightQ4_K[7168 7168]
-
blk.41.attn_v.weightQ4_K[7168 1024]
-
blk.42.ffn_gate.weightQ4_K[7168 20480]
-
blk.42.attn_k.weightQ4_K[7168 1024]
-
blk.42.attn_output.weightQ4_K[7168 7168]
-
blk.42.attn_q.weightQ4_K[7168 7168]
-
blk.42.attn_v.weightQ6_K[7168 1024]
-
blk.42.attn_norm.weightF32[7168]
-
blk.42.ffn_down.weightQ6_K[20480 7168]
-
blk.42.ffn_up.weightQ4_K[7168 20480]
-
blk.42.ffn_norm.weightF32[7168]
-
blk.43.attn_norm.weightF32[7168]
-
blk.43.ffn_down.weightQ4_K[20480 7168]
-
blk.43.ffn_gate.weightQ4_K[7168 20480]
-
blk.43.ffn_up.weightQ4_K[7168 20480]
-
blk.43.ffn_norm.weightF32[7168]
-
blk.43.attn_k.weightQ4_K[7168 1024]
-
blk.43.attn_output.weightQ4_K[7168 7168]
-
blk.43.attn_q.weightQ4_K[7168 7168]
-
blk.43.attn_v.weightQ4_K[7168 1024]
-
blk.44.attn_norm.weightF32[7168]
-
blk.44.ffn_down.weightQ4_K[20480 7168]
-
blk.44.ffn_gate.weightQ4_K[7168 20480]
-
blk.44.ffn_up.weightQ4_K[7168 20480]
-
blk.44.ffn_norm.weightF32[7168]
-
blk.44.attn_k.weightQ4_K[7168 1024]
-
blk.44.attn_output.weightQ4_K[7168 7168]
-
blk.44.attn_q.weightQ4_K[7168 7168]
-
blk.44.attn_v.weightQ4_K[7168 1024]
-
blk.45.attn_norm.weightF32[7168]
-
blk.45.ffn_down.weightQ6_K[20480 7168]
-
blk.45.ffn_gate.weightQ4_K[7168 20480]
-
blk.45.ffn_up.weightQ4_K[7168 20480]
-
blk.45.ffn_norm.weightF32[7168]
-
blk.45.attn_k.weightQ4_K[7168 1024]
-
blk.45.attn_output.weightQ4_K[7168 7168]
-
blk.45.attn_q.weightQ4_K[7168 7168]
-
blk.45.attn_v.weightQ6_K[7168 1024]
-
blk.46.ffn_gate.weightQ4_K[7168 20480]
-
blk.46.ffn_up.weightQ4_K[7168 20480]
-
blk.46.attn_k.weightQ4_K[7168 1024]
-
blk.46.attn_output.weightQ4_K[7168 7168]
-
blk.46.attn_q.weightQ4_K[7168 7168]
-
blk.46.attn_v.weightQ4_K[7168 1024]
-
blk.46.attn_norm.weightF32[7168]
-
blk.46.ffn_down.weightQ4_K[20480 7168]
-
blk.46.ffn_norm.weightF32[7168]
-
blk.47.attn_norm.weightF32[7168]
-
blk.47.ffn_down.weightQ4_K[20480 7168]
-
blk.47.ffn_gate.weightQ4_K[7168 20480]
-
blk.47.ffn_up.weightQ4_K[7168 20480]
-
blk.47.ffn_norm.weightF32[7168]
-
blk.47.attn_k.weightQ4_K[7168 1024]
-
blk.47.attn_output.weightQ4_K[7168 7168]
-
blk.47.attn_q.weightQ4_K[7168 7168]
-
blk.47.attn_v.weightQ4_K[7168 1024]
-
blk.48.attn_norm.weightF32[7168]
-
blk.48.ffn_down.weightQ6_K[20480 7168]
-
blk.48.ffn_gate.weightQ4_K[7168 20480]
-
blk.48.ffn_up.weightQ4_K[7168 20480]
-
blk.48.ffn_norm.weightF32[7168]
-
blk.48.attn_k.weightQ4_K[7168 1024]
-
blk.48.attn_output.weightQ4_K[7168 7168]
-
blk.48.attn_q.weightQ4_K[7168 7168]
-
blk.48.attn_v.weightQ6_K[7168 1024]
-
blk.49.attn_norm.weightF32[7168]
-
blk.49.ffn_down.weightQ4_K[20480 7168]
-
blk.49.ffn_gate.weightQ4_K[7168 20480]
-
blk.49.ffn_up.weightQ4_K[7168 20480]
-
blk.49.ffn_norm.weightF32[7168]
-
blk.49.attn_k.weightQ4_K[7168 1024]
-
blk.49.attn_output.weightQ4_K[7168 7168]
-
blk.49.attn_q.weightQ4_K[7168 7168]
-
blk.49.attn_v.weightQ4_K[7168 1024]
-
blk.50.attn_norm.weightF32[7168]
-
blk.50.ffn_down.weightQ4_K[20480 7168]
-
blk.50.ffn_gate.weightQ4_K[7168 20480]
-
blk.50.ffn_up.weightQ4_K[7168 20480]
-
blk.50.ffn_norm.weightF32[7168]
-
blk.50.attn_k.weightQ4_K[7168 1024]
-
blk.50.attn_output.weightQ4_K[7168 7168]
-
blk.50.attn_q.weightQ4_K[7168 7168]
-
blk.50.attn_v.weightQ4_K[7168 1024]
-
blk.51.attn_k.weightQ4_K[7168 1024]
-
blk.51.attn_output.weightQ4_K[7168 7168]
-
blk.51.attn_q.weightQ4_K[7168 7168]
-
blk.51.attn_v.weightQ6_K[7168 1024]
-
blk.51.attn_norm.weightF32[7168]
-
blk.51.ffn_down.weightQ6_K[20480 7168]
-
blk.51.ffn_gate.weightQ4_K[7168 20480]
-
blk.51.ffn_up.weightQ4_K[7168 20480]
-
blk.51.ffn_norm.weightF32[7168]
-
blk.52.attn_norm.weightF32[7168]
-
blk.52.ffn_down.weightQ6_K[20480 7168]
-
blk.52.ffn_gate.weightQ4_K[7168 20480]
-
blk.52.ffn_up.weightQ4_K[7168 20480]
-
blk.52.ffn_norm.weightF32[7168]
-
blk.52.attn_k.weightQ4_K[7168 1024]
-
blk.52.attn_output.weightQ4_K[7168 7168]
-
blk.52.attn_q.weightQ4_K[7168 7168]
-
blk.52.attn_v.weightQ6_K[7168 1024]
-
blk.53.attn_norm.weightF32[7168]
-
blk.53.ffn_down.weightQ6_K[20480 7168]
-
blk.53.ffn_gate.weightQ4_K[7168 20480]
-
blk.53.ffn_up.weightQ4_K[7168 20480]
-
blk.53.ffn_norm.weightF32[7168]
-
blk.53.attn_k.weightQ4_K[7168 1024]
-
blk.53.attn_output.weightQ4_K[7168 7168]
-
blk.53.attn_q.weightQ4_K[7168 7168]
-
blk.53.attn_v.weightQ6_K[7168 1024]
-
blk.54.attn_norm.weightF32[7168]
-
blk.54.ffn_down.weightQ6_K[20480 7168]
-
blk.54.ffn_gate.weightQ4_K[7168 20480]
-
blk.54.ffn_up.weightQ4_K[7168 20480]
-
blk.54.ffn_norm.weightF32[7168]
-
blk.54.attn_k.weightQ4_K[7168 1024]
-
blk.54.attn_output.weightQ4_K[7168 7168]
-
blk.54.attn_q.weightQ4_K[7168 7168]
-
blk.54.attn_v.weightQ6_K[7168 1024]
-
blk.55.ffn_gate.weightQ4_K[7168 20480]
-
blk.55.attn_k.weightQ4_K[7168 1024]
-
blk.55.attn_output.weightQ4_K[7168 7168]
-
blk.55.attn_q.weightQ4_K[7168 7168]
-
blk.55.attn_v.weightQ6_K[7168 1024]
-
blk.55.attn_norm.weightF32[7168]
-
blk.55.ffn_down.weightQ6_K[20480 7168]
-
blk.55.ffn_up.weightQ4_K[7168 20480]
-
blk.55.ffn_norm.weightF32[7168]
-
blk.56.attn_norm.weightF32[7168]
-
blk.56.ffn_down.weightQ6_K[20480 7168]
-
blk.56.ffn_gate.weightQ4_K[7168 20480]
-
blk.56.ffn_up.weightQ4_K[7168 20480]
-
blk.56.ffn_norm.weightF32[7168]
-
blk.56.attn_k.weightQ4_K[7168 1024]
-
blk.56.attn_output.weightQ4_K[7168 7168]
-
blk.56.attn_q.weightQ4_K[7168 7168]
-
blk.56.attn_v.weightQ6_K[7168 1024]
-
blk.57.attn_norm.weightF32[7168]
-
blk.57.ffn_down.weightQ6_K[20480 7168]
-
blk.57.ffn_gate.weightQ4_K[7168 20480]
-
blk.57.ffn_up.weightQ4_K[7168 20480]
-
blk.57.ffn_norm.weightF32[7168]
-
blk.57.attn_k.weightQ4_K[7168 1024]
-
blk.57.attn_output.weightQ4_K[7168 7168]
-
blk.57.attn_q.weightQ4_K[7168 7168]
-
blk.57.attn_v.weightQ6_K[7168 1024]
-
blk.58.attn_norm.weightF32[7168]
-
blk.58.ffn_down.weightQ6_K[20480 7168]
-
blk.58.ffn_gate.weightQ4_K[7168 20480]
-
blk.58.ffn_up.weightQ4_K[7168 20480]
-
blk.58.ffn_norm.weightF32[7168]
-
blk.58.attn_k.weightQ4_K[7168 1024]
-
blk.58.attn_output.weightQ4_K[7168 7168]
-
blk.58.attn_q.weightQ4_K[7168 7168]
-
blk.58.attn_v.weightQ6_K[7168 1024]
-
blk.59.ffn_gate.weightQ4_K[7168 20480]
-
blk.59.ffn_up.weightQ4_K[7168 20480]
-
blk.59.attn_k.weightQ4_K[7168 1024]
-
blk.59.attn_output.weightQ4_K[7168 7168]
-
blk.59.attn_q.weightQ4_K[7168 7168]
-
blk.59.attn_v.weightQ6_K[7168 1024]
-
blk.59.attn_norm.weightF32[7168]
-
blk.59.ffn_down.weightQ6_K[20480 7168]
-
blk.59.ffn_norm.weightF32[7168]
-
output.weightF16[7168 64000]
-
output_norm.weightF32[7168]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59