latest
24GB
dolphin-2.9.3-Yi-1.5-34B-32k-Q5_K_M
34B
25 Pulls Updated 2 months ago
5f5e48ef2ea2 · 24GB
-
quantize.imatrix.chunks_count146
-
quantize.imatrix.dataset/training_data/calibration_datav3.txt
-
quantize.imatrix.entries_count420
-
quantize.imatrix.file/models/dolphin-2.9.3-Yi-1.5-34B-32k-GGUF/dolphin-2.9.3-Yi-1.5-34B-32k.imatrix
-
general.architecturellama
-
general.file_typeQ5_K_M
-
llama.attention.head_count56
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-06
-
llama.block_count60
-
llama.context_length32768
-
llama.embedding_length7168
-
llama.feed_forward_length20480
-
llama.rope.dimension_count128
-
llama.rope.freq_base5e+06
-
llama.vocab_size64000
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id7
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <|startoftext|> <|endoftext|> <|Human|> <|Assistant|> ...]
-
NameTypeShape
-
token_embd.weightQ5_K[7168 64000]
-
blk.0.attn_q.weightQ5_K[7168 7168]
-
blk.0.attn_k.weightQ5_K[7168 1024]
-
blk.0.attn_v.weightQ6_K[7168 1024]
-
blk.0.attn_output.weightQ5_K[7168 7168]
-
blk.0.ffn_gate.weightQ5_K[7168 20480]
-
blk.0.ffn_up.weightQ5_K[7168 20480]
-
blk.0.ffn_down.weightQ6_K[20480 7168]
-
blk.0.attn_norm.weightF32[7168]
-
blk.0.ffn_norm.weightF32[7168]
-
blk.1.attn_q.weightQ5_K[7168 7168]
-
blk.1.attn_k.weightQ5_K[7168 1024]
-
blk.1.attn_v.weightQ6_K[7168 1024]
-
blk.1.attn_output.weightQ5_K[7168 7168]
-
blk.1.ffn_gate.weightQ5_K[7168 20480]
-
blk.1.ffn_up.weightQ5_K[7168 20480]
-
blk.1.ffn_down.weightQ6_K[20480 7168]
-
blk.1.attn_norm.weightF32[7168]
-
blk.1.ffn_norm.weightF32[7168]
-
blk.2.attn_q.weightQ5_K[7168 7168]
-
blk.2.attn_k.weightQ5_K[7168 1024]
-
blk.2.attn_v.weightQ6_K[7168 1024]
-
blk.2.attn_output.weightQ5_K[7168 7168]
-
blk.2.ffn_gate.weightQ5_K[7168 20480]
-
blk.2.ffn_up.weightQ5_K[7168 20480]
-
blk.2.ffn_down.weightQ6_K[20480 7168]
-
blk.2.attn_norm.weightF32[7168]
-
blk.2.ffn_norm.weightF32[7168]
-
blk.3.attn_q.weightQ5_K[7168 7168]
-
blk.3.attn_k.weightQ5_K[7168 1024]
-
blk.3.attn_v.weightQ6_K[7168 1024]
-
blk.3.attn_output.weightQ5_K[7168 7168]
-
blk.3.ffn_gate.weightQ5_K[7168 20480]
-
blk.3.ffn_up.weightQ5_K[7168 20480]
-
blk.3.ffn_down.weightQ6_K[20480 7168]
-
blk.3.attn_norm.weightF32[7168]
-
blk.3.ffn_norm.weightF32[7168]
-
blk.4.attn_q.weightQ5_K[7168 7168]
-
blk.4.attn_k.weightQ5_K[7168 1024]
-
blk.4.attn_v.weightQ6_K[7168 1024]
-
blk.4.attn_output.weightQ5_K[7168 7168]
-
blk.4.ffn_gate.weightQ5_K[7168 20480]
-
blk.4.ffn_up.weightQ5_K[7168 20480]
-
blk.4.ffn_down.weightQ6_K[20480 7168]
-
blk.4.attn_norm.weightF32[7168]
-
blk.4.ffn_norm.weightF32[7168]
-
blk.5.attn_q.weightQ5_K[7168 7168]
-
blk.5.attn_k.weightQ5_K[7168 1024]
-
blk.5.attn_v.weightQ6_K[7168 1024]
-
blk.5.attn_output.weightQ5_K[7168 7168]
-
blk.5.ffn_gate.weightQ5_K[7168 20480]
-
blk.5.ffn_up.weightQ5_K[7168 20480]
-
blk.5.ffn_down.weightQ6_K[20480 7168]
-
blk.5.attn_norm.weightF32[7168]
-
blk.5.ffn_norm.weightF32[7168]
-
blk.6.attn_q.weightQ5_K[7168 7168]
-
blk.6.attn_k.weightQ5_K[7168 1024]
-
blk.6.attn_v.weightQ6_K[7168 1024]
-
blk.6.attn_output.weightQ5_K[7168 7168]
-
blk.6.ffn_gate.weightQ5_K[7168 20480]
-
blk.6.ffn_up.weightQ5_K[7168 20480]
-
blk.6.ffn_down.weightQ6_K[20480 7168]
-
blk.6.attn_norm.weightF32[7168]
-
blk.6.ffn_norm.weightF32[7168]
-
blk.7.attn_q.weightQ5_K[7168 7168]
-
blk.7.attn_k.weightQ5_K[7168 1024]
-
blk.7.attn_v.weightQ5_K[7168 1024]
-
blk.7.attn_output.weightQ5_K[7168 7168]
-
blk.7.ffn_gate.weightQ5_K[7168 20480]
-
blk.7.ffn_up.weightQ5_K[7168 20480]
-
blk.7.ffn_down.weightQ5_K[20480 7168]
-
blk.7.attn_norm.weightF32[7168]
-
blk.7.ffn_norm.weightF32[7168]
-
blk.8.attn_q.weightQ5_K[7168 7168]
-
blk.8.attn_k.weightQ5_K[7168 1024]
-
blk.8.attn_v.weightQ5_K[7168 1024]
-
blk.8.attn_output.weightQ5_K[7168 7168]
-
blk.8.ffn_gate.weightQ5_K[7168 20480]
-
blk.8.ffn_up.weightQ5_K[7168 20480]
-
blk.8.ffn_down.weightQ5_K[20480 7168]
-
blk.8.attn_norm.weightF32[7168]
-
blk.8.ffn_norm.weightF32[7168]
-
blk.9.attn_q.weightQ5_K[7168 7168]
-
blk.9.attn_k.weightQ5_K[7168 1024]
-
blk.9.attn_v.weightQ6_K[7168 1024]
-
blk.9.attn_output.weightQ5_K[7168 7168]
-
blk.9.ffn_gate.weightQ5_K[7168 20480]
-
blk.9.ffn_up.weightQ5_K[7168 20480]
-
blk.9.ffn_down.weightQ6_K[20480 7168]
-
blk.9.attn_norm.weightF32[7168]
-
blk.9.ffn_norm.weightF32[7168]
-
blk.10.attn_q.weightQ5_K[7168 7168]
-
blk.10.attn_k.weightQ5_K[7168 1024]
-
blk.10.attn_v.weightQ5_K[7168 1024]
-
blk.10.attn_output.weightQ5_K[7168 7168]
-
blk.10.ffn_gate.weightQ5_K[7168 20480]
-
blk.10.ffn_up.weightQ5_K[7168 20480]
-
blk.10.ffn_down.weightQ5_K[20480 7168]
-
blk.10.attn_norm.weightF32[7168]
-
blk.10.ffn_norm.weightF32[7168]
-
blk.11.attn_q.weightQ5_K[7168 7168]
-
blk.11.attn_k.weightQ5_K[7168 1024]
-
blk.11.attn_v.weightQ5_K[7168 1024]
-
blk.11.attn_output.weightQ5_K[7168 7168]
-
blk.11.ffn_gate.weightQ5_K[7168 20480]
-
blk.11.ffn_up.weightQ5_K[7168 20480]
-
blk.11.ffn_down.weightQ5_K[20480 7168]
-
blk.11.attn_norm.weightF32[7168]
-
blk.11.ffn_norm.weightF32[7168]
-
blk.12.attn_q.weightQ5_K[7168 7168]
-
blk.12.attn_k.weightQ5_K[7168 1024]
-
blk.12.attn_v.weightQ6_K[7168 1024]
-
blk.12.attn_output.weightQ5_K[7168 7168]
-
blk.12.ffn_gate.weightQ5_K[7168 20480]
-
blk.12.ffn_up.weightQ5_K[7168 20480]
-
blk.12.ffn_down.weightQ6_K[20480 7168]
-
blk.12.attn_norm.weightF32[7168]
-
blk.12.ffn_norm.weightF32[7168]
-
blk.13.attn_q.weightQ5_K[7168 7168]
-
blk.13.attn_k.weightQ5_K[7168 1024]
-
blk.13.attn_v.weightQ5_K[7168 1024]
-
blk.13.attn_output.weightQ5_K[7168 7168]
-
blk.13.ffn_gate.weightQ5_K[7168 20480]
-
blk.13.ffn_up.weightQ5_K[7168 20480]
-
blk.13.ffn_down.weightQ5_K[20480 7168]
-
blk.13.attn_norm.weightF32[7168]
-
blk.13.ffn_norm.weightF32[7168]
-
blk.14.attn_q.weightQ5_K[7168 7168]
-
blk.14.attn_k.weightQ5_K[7168 1024]
-
blk.14.attn_v.weightQ5_K[7168 1024]
-
blk.14.attn_output.weightQ5_K[7168 7168]
-
blk.14.ffn_gate.weightQ5_K[7168 20480]
-
blk.14.ffn_up.weightQ5_K[7168 20480]
-
blk.14.ffn_down.weightQ5_K[20480 7168]
-
blk.14.attn_norm.weightF32[7168]
-
blk.14.ffn_norm.weightF32[7168]
-
blk.15.attn_q.weightQ5_K[7168 7168]
-
blk.15.attn_k.weightQ5_K[7168 1024]
-
blk.15.attn_v.weightQ6_K[7168 1024]
-
blk.15.attn_output.weightQ5_K[7168 7168]
-
blk.15.ffn_gate.weightQ5_K[7168 20480]
-
blk.15.ffn_up.weightQ5_K[7168 20480]
-
blk.15.ffn_down.weightQ6_K[20480 7168]
-
blk.15.attn_norm.weightF32[7168]
-
blk.15.ffn_norm.weightF32[7168]
-
blk.16.attn_q.weightQ5_K[7168 7168]
-
blk.16.attn_k.weightQ5_K[7168 1024]
-
blk.16.attn_v.weightQ5_K[7168 1024]
-
blk.16.attn_output.weightQ5_K[7168 7168]
-
blk.16.ffn_gate.weightQ5_K[7168 20480]
-
blk.16.ffn_up.weightQ5_K[7168 20480]
-
blk.16.ffn_down.weightQ5_K[20480 7168]
-
blk.16.attn_norm.weightF32[7168]
-
blk.16.ffn_norm.weightF32[7168]
-
blk.17.attn_q.weightQ5_K[7168 7168]
-
blk.17.attn_k.weightQ5_K[7168 1024]
-
blk.17.attn_v.weightQ5_K[7168 1024]
-
blk.17.attn_output.weightQ5_K[7168 7168]
-
blk.17.ffn_gate.weightQ5_K[7168 20480]
-
blk.17.ffn_up.weightQ5_K[7168 20480]
-
blk.17.ffn_down.weightQ5_K[20480 7168]
-
blk.17.attn_norm.weightF32[7168]
-
blk.17.ffn_norm.weightF32[7168]
-
blk.18.attn_q.weightQ5_K[7168 7168]
-
blk.18.attn_k.weightQ5_K[7168 1024]
-
blk.18.attn_v.weightQ6_K[7168 1024]
-
blk.18.attn_output.weightQ5_K[7168 7168]
-
blk.18.ffn_gate.weightQ5_K[7168 20480]
-
blk.18.ffn_up.weightQ5_K[7168 20480]
-
blk.18.ffn_down.weightQ6_K[20480 7168]
-
blk.18.attn_norm.weightF32[7168]
-
blk.18.ffn_norm.weightF32[7168]
-
blk.19.attn_q.weightQ5_K[7168 7168]
-
blk.19.attn_k.weightQ5_K[7168 1024]
-
blk.19.attn_v.weightQ5_K[7168 1024]
-
blk.19.attn_output.weightQ5_K[7168 7168]
-
blk.19.ffn_gate.weightQ5_K[7168 20480]
-
blk.19.ffn_up.weightQ5_K[7168 20480]
-
blk.19.ffn_down.weightQ5_K[20480 7168]
-
blk.19.attn_norm.weightF32[7168]
-
blk.19.ffn_norm.weightF32[7168]
-
blk.20.attn_q.weightQ5_K[7168 7168]
-
blk.20.attn_k.weightQ5_K[7168 1024]
-
blk.20.attn_v.weightQ5_K[7168 1024]
-
blk.20.attn_output.weightQ5_K[7168 7168]
-
blk.20.ffn_gate.weightQ5_K[7168 20480]
-
blk.20.ffn_up.weightQ5_K[7168 20480]
-
blk.20.ffn_down.weightQ5_K[20480 7168]
-
blk.20.attn_norm.weightF32[7168]
-
blk.20.ffn_norm.weightF32[7168]
-
blk.21.attn_q.weightQ5_K[7168 7168]
-
blk.21.attn_k.weightQ5_K[7168 1024]
-
blk.21.attn_v.weightQ6_K[7168 1024]
-
blk.21.attn_output.weightQ5_K[7168 7168]
-
blk.21.ffn_gate.weightQ5_K[7168 20480]
-
blk.21.ffn_up.weightQ5_K[7168 20480]
-
blk.21.ffn_down.weightQ6_K[20480 7168]
-
blk.21.attn_norm.weightF32[7168]
-
blk.21.ffn_norm.weightF32[7168]
-
blk.22.attn_q.weightQ5_K[7168 7168]
-
blk.22.attn_k.weightQ5_K[7168 1024]
-
blk.22.attn_v.weightQ5_K[7168 1024]
-
blk.22.attn_output.weightQ5_K[7168 7168]
-
blk.22.ffn_gate.weightQ5_K[7168 20480]
-
blk.22.ffn_up.weightQ5_K[7168 20480]
-
blk.22.ffn_down.weightQ5_K[20480 7168]
-
blk.22.attn_norm.weightF32[7168]
-
blk.22.ffn_norm.weightF32[7168]
-
blk.23.attn_q.weightQ5_K[7168 7168]
-
blk.23.attn_k.weightQ5_K[7168 1024]
-
blk.23.attn_v.weightQ5_K[7168 1024]
-
blk.23.attn_output.weightQ5_K[7168 7168]
-
blk.23.ffn_gate.weightQ5_K[7168 20480]
-
blk.23.ffn_up.weightQ5_K[7168 20480]
-
blk.23.ffn_down.weightQ5_K[20480 7168]
-
blk.23.attn_norm.weightF32[7168]
-
blk.23.ffn_norm.weightF32[7168]
-
blk.24.attn_q.weightQ5_K[7168 7168]
-
blk.24.attn_k.weightQ5_K[7168 1024]
-
blk.24.attn_v.weightQ6_K[7168 1024]
-
blk.24.attn_output.weightQ5_K[7168 7168]
-
blk.24.ffn_gate.weightQ5_K[7168 20480]
-
blk.24.ffn_up.weightQ5_K[7168 20480]
-
blk.24.ffn_down.weightQ6_K[20480 7168]
-
blk.24.attn_norm.weightF32[7168]
-
blk.24.ffn_norm.weightF32[7168]
-
blk.25.attn_q.weightQ5_K[7168 7168]
-
blk.25.attn_k.weightQ5_K[7168 1024]
-
blk.25.attn_v.weightQ5_K[7168 1024]
-
blk.25.attn_output.weightQ5_K[7168 7168]
-
blk.25.ffn_gate.weightQ5_K[7168 20480]
-
blk.25.ffn_up.weightQ5_K[7168 20480]
-
blk.25.ffn_down.weightQ5_K[20480 7168]
-
blk.25.attn_norm.weightF32[7168]
-
blk.25.ffn_norm.weightF32[7168]
-
blk.26.attn_q.weightQ5_K[7168 7168]
-
blk.26.attn_k.weightQ5_K[7168 1024]
-
blk.26.attn_v.weightQ5_K[7168 1024]
-
blk.26.attn_output.weightQ5_K[7168 7168]
-
blk.26.ffn_gate.weightQ5_K[7168 20480]
-
blk.26.ffn_up.weightQ5_K[7168 20480]
-
blk.26.ffn_down.weightQ5_K[20480 7168]
-
blk.26.attn_norm.weightF32[7168]
-
blk.26.ffn_norm.weightF32[7168]
-
blk.27.attn_q.weightQ5_K[7168 7168]
-
blk.27.attn_k.weightQ5_K[7168 1024]
-
blk.27.attn_v.weightQ6_K[7168 1024]
-
blk.27.attn_output.weightQ5_K[7168 7168]
-
blk.27.ffn_gate.weightQ5_K[7168 20480]
-
blk.27.ffn_up.weightQ5_K[7168 20480]
-
blk.27.ffn_down.weightQ6_K[20480 7168]
-
blk.27.attn_norm.weightF32[7168]
-
blk.27.ffn_norm.weightF32[7168]
-
blk.28.attn_q.weightQ5_K[7168 7168]
-
blk.28.attn_k.weightQ5_K[7168 1024]
-
blk.28.attn_v.weightQ5_K[7168 1024]
-
blk.28.attn_output.weightQ5_K[7168 7168]
-
blk.28.ffn_gate.weightQ5_K[7168 20480]
-
blk.28.ffn_up.weightQ5_K[7168 20480]
-
blk.28.ffn_down.weightQ5_K[20480 7168]
-
blk.28.attn_norm.weightF32[7168]
-
blk.28.ffn_norm.weightF32[7168]
-
blk.29.attn_q.weightQ5_K[7168 7168]
-
blk.29.attn_k.weightQ5_K[7168 1024]
-
blk.29.attn_v.weightQ5_K[7168 1024]
-
blk.29.attn_output.weightQ5_K[7168 7168]
-
blk.29.ffn_gate.weightQ5_K[7168 20480]
-
blk.29.ffn_up.weightQ5_K[7168 20480]
-
blk.29.ffn_down.weightQ5_K[20480 7168]
-
blk.29.attn_norm.weightF32[7168]
-
blk.29.ffn_norm.weightF32[7168]
-
blk.30.attn_q.weightQ5_K[7168 7168]
-
blk.30.attn_k.weightQ5_K[7168 1024]
-
blk.30.attn_v.weightQ6_K[7168 1024]
-
blk.30.attn_output.weightQ5_K[7168 7168]
-
blk.30.ffn_gate.weightQ5_K[7168 20480]
-
blk.30.ffn_up.weightQ5_K[7168 20480]
-
blk.30.ffn_down.weightQ6_K[20480 7168]
-
blk.30.attn_norm.weightF32[7168]
-
blk.30.ffn_norm.weightF32[7168]
-
blk.31.attn_q.weightQ5_K[7168 7168]
-
blk.31.attn_k.weightQ5_K[7168 1024]
-
blk.31.attn_v.weightQ5_K[7168 1024]
-
blk.31.attn_output.weightQ5_K[7168 7168]
-
blk.31.ffn_gate.weightQ5_K[7168 20480]
-
blk.31.ffn_up.weightQ5_K[7168 20480]
-
blk.31.ffn_down.weightQ5_K[20480 7168]
-
blk.31.attn_norm.weightF32[7168]
-
blk.31.ffn_norm.weightF32[7168]
-
blk.32.attn_q.weightQ5_K[7168 7168]
-
blk.32.attn_k.weightQ5_K[7168 1024]
-
blk.32.attn_v.weightQ5_K[7168 1024]
-
blk.32.attn_output.weightQ5_K[7168 7168]
-
blk.32.ffn_gate.weightQ5_K[7168 20480]
-
blk.32.ffn_up.weightQ5_K[7168 20480]
-
blk.32.ffn_down.weightQ5_K[20480 7168]
-
blk.32.attn_norm.weightF32[7168]
-
blk.32.ffn_norm.weightF32[7168]
-
blk.33.attn_q.weightQ5_K[7168 7168]
-
blk.33.attn_k.weightQ5_K[7168 1024]
-
blk.33.attn_v.weightQ6_K[7168 1024]
-
blk.33.attn_output.weightQ5_K[7168 7168]
-
blk.33.ffn_gate.weightQ5_K[7168 20480]
-
blk.33.ffn_up.weightQ5_K[7168 20480]
-
blk.33.ffn_down.weightQ6_K[20480 7168]
-
blk.33.attn_norm.weightF32[7168]
-
blk.33.ffn_norm.weightF32[7168]
-
blk.34.attn_q.weightQ5_K[7168 7168]
-
blk.34.attn_k.weightQ5_K[7168 1024]
-
blk.34.attn_v.weightQ5_K[7168 1024]
-
blk.34.attn_output.weightQ5_K[7168 7168]
-
blk.34.ffn_gate.weightQ5_K[7168 20480]
-
blk.34.ffn_up.weightQ5_K[7168 20480]
-
blk.34.ffn_down.weightQ5_K[20480 7168]
-
blk.34.attn_norm.weightF32[7168]
-
blk.34.ffn_norm.weightF32[7168]
-
blk.35.attn_q.weightQ5_K[7168 7168]
-
blk.35.attn_k.weightQ5_K[7168 1024]
-
blk.35.attn_v.weightQ5_K[7168 1024]
-
blk.35.attn_output.weightQ5_K[7168 7168]
-
blk.35.ffn_gate.weightQ5_K[7168 20480]
-
blk.35.ffn_up.weightQ5_K[7168 20480]
-
blk.35.ffn_down.weightQ5_K[20480 7168]
-
blk.35.attn_norm.weightF32[7168]
-
blk.35.ffn_norm.weightF32[7168]
-
blk.36.attn_q.weightQ5_K[7168 7168]
-
blk.36.attn_k.weightQ5_K[7168 1024]
-
blk.36.attn_v.weightQ6_K[7168 1024]
-
blk.36.attn_output.weightQ5_K[7168 7168]
-
blk.36.ffn_gate.weightQ5_K[7168 20480]
-
blk.36.ffn_up.weightQ5_K[7168 20480]
-
blk.36.ffn_down.weightQ6_K[20480 7168]
-
blk.36.attn_norm.weightF32[7168]
-
blk.36.ffn_norm.weightF32[7168]
-
blk.37.attn_q.weightQ5_K[7168 7168]
-
blk.37.attn_k.weightQ5_K[7168 1024]
-
blk.37.attn_v.weightQ5_K[7168 1024]
-
blk.37.attn_output.weightQ5_K[7168 7168]
-
blk.37.ffn_gate.weightQ5_K[7168 20480]
-
blk.37.ffn_up.weightQ5_K[7168 20480]
-
blk.37.ffn_down.weightQ5_K[20480 7168]
-
blk.37.attn_norm.weightF32[7168]
-
blk.37.ffn_norm.weightF32[7168]
-
blk.38.attn_q.weightQ5_K[7168 7168]
-
blk.38.attn_k.weightQ5_K[7168 1024]
-
blk.38.attn_v.weightQ5_K[7168 1024]
-
blk.38.attn_output.weightQ5_K[7168 7168]
-
blk.38.ffn_gate.weightQ5_K[7168 20480]
-
blk.38.ffn_up.weightQ5_K[7168 20480]
-
blk.38.ffn_down.weightQ5_K[20480 7168]
-
blk.38.attn_norm.weightF32[7168]
-
blk.38.ffn_norm.weightF32[7168]
-
blk.39.attn_q.weightQ5_K[7168 7168]
-
blk.39.attn_k.weightQ5_K[7168 1024]
-
blk.39.attn_v.weightQ6_K[7168 1024]
-
blk.39.attn_output.weightQ5_K[7168 7168]
-
blk.39.ffn_gate.weightQ5_K[7168 20480]
-
blk.39.ffn_up.weightQ5_K[7168 20480]
-
blk.39.ffn_down.weightQ6_K[20480 7168]
-
blk.39.attn_norm.weightF32[7168]
-
blk.39.ffn_norm.weightF32[7168]
-
blk.40.attn_q.weightQ5_K[7168 7168]
-
blk.40.attn_k.weightQ5_K[7168 1024]
-
blk.40.attn_v.weightQ5_K[7168 1024]
-
blk.40.attn_output.weightQ5_K[7168 7168]
-
blk.40.ffn_gate.weightQ5_K[7168 20480]
-
blk.40.ffn_up.weightQ5_K[7168 20480]
-
blk.40.ffn_down.weightQ5_K[20480 7168]
-
blk.40.attn_norm.weightF32[7168]
-
blk.40.ffn_norm.weightF32[7168]
-
blk.41.attn_q.weightQ5_K[7168 7168]
-
blk.41.attn_k.weightQ5_K[7168 1024]
-
blk.41.attn_v.weightQ5_K[7168 1024]
-
blk.41.attn_output.weightQ5_K[7168 7168]
-
blk.41.ffn_gate.weightQ5_K[7168 20480]
-
blk.41.ffn_up.weightQ5_K[7168 20480]
-
blk.41.ffn_down.weightQ5_K[20480 7168]
-
blk.41.attn_norm.weightF32[7168]
-
blk.41.ffn_norm.weightF32[7168]
-
blk.42.attn_q.weightQ5_K[7168 7168]
-
blk.42.attn_k.weightQ5_K[7168 1024]
-
blk.42.attn_v.weightQ6_K[7168 1024]
-
blk.42.attn_output.weightQ5_K[7168 7168]
-
blk.42.ffn_gate.weightQ5_K[7168 20480]
-
blk.42.ffn_up.weightQ5_K[7168 20480]
-
blk.42.ffn_down.weightQ6_K[20480 7168]
-
blk.42.attn_norm.weightF32[7168]
-
blk.42.ffn_norm.weightF32[7168]
-
blk.43.attn_q.weightQ5_K[7168 7168]
-
blk.43.attn_k.weightQ5_K[7168 1024]
-
blk.43.attn_v.weightQ5_K[7168 1024]
-
blk.43.attn_output.weightQ5_K[7168 7168]
-
blk.43.ffn_gate.weightQ5_K[7168 20480]
-
blk.43.ffn_up.weightQ5_K[7168 20480]
-
blk.43.ffn_down.weightQ5_K[20480 7168]
-
blk.43.attn_norm.weightF32[7168]
-
blk.43.ffn_norm.weightF32[7168]
-
blk.44.attn_q.weightQ5_K[7168 7168]
-
blk.44.attn_k.weightQ5_K[7168 1024]
-
blk.44.attn_v.weightQ5_K[7168 1024]
-
blk.44.attn_output.weightQ5_K[7168 7168]
-
blk.44.ffn_gate.weightQ5_K[7168 20480]
-
blk.44.ffn_up.weightQ5_K[7168 20480]
-
blk.44.ffn_down.weightQ5_K[20480 7168]
-
blk.44.attn_norm.weightF32[7168]
-
blk.44.ffn_norm.weightF32[7168]
-
blk.45.attn_q.weightQ5_K[7168 7168]
-
blk.45.attn_k.weightQ5_K[7168 1024]
-
blk.45.attn_v.weightQ6_K[7168 1024]
-
blk.45.attn_output.weightQ5_K[7168 7168]
-
blk.45.ffn_gate.weightQ5_K[7168 20480]
-
blk.45.ffn_up.weightQ5_K[7168 20480]
-
blk.45.ffn_down.weightQ6_K[20480 7168]
-
blk.45.attn_norm.weightF32[7168]
-
blk.45.ffn_norm.weightF32[7168]
-
blk.46.attn_q.weightQ5_K[7168 7168]
-
blk.46.attn_k.weightQ5_K[7168 1024]
-
blk.46.attn_v.weightQ5_K[7168 1024]
-
blk.46.attn_output.weightQ5_K[7168 7168]
-
blk.46.ffn_gate.weightQ5_K[7168 20480]
-
blk.46.ffn_up.weightQ5_K[7168 20480]
-
blk.46.ffn_down.weightQ5_K[20480 7168]
-
blk.46.attn_norm.weightF32[7168]
-
blk.46.ffn_norm.weightF32[7168]
-
blk.47.attn_q.weightQ5_K[7168 7168]
-
blk.47.attn_k.weightQ5_K[7168 1024]
-
blk.47.attn_v.weightQ5_K[7168 1024]
-
blk.47.attn_output.weightQ5_K[7168 7168]
-
blk.47.ffn_gate.weightQ5_K[7168 20480]
-
blk.47.ffn_up.weightQ5_K[7168 20480]
-
blk.47.ffn_down.weightQ5_K[20480 7168]
-
blk.47.attn_norm.weightF32[7168]
-
blk.47.ffn_norm.weightF32[7168]
-
blk.48.attn_q.weightQ5_K[7168 7168]
-
blk.48.attn_k.weightQ5_K[7168 1024]
-
blk.48.attn_v.weightQ6_K[7168 1024]
-
blk.48.attn_output.weightQ5_K[7168 7168]
-
blk.48.ffn_gate.weightQ5_K[7168 20480]
-
blk.48.ffn_up.weightQ5_K[7168 20480]
-
blk.48.ffn_down.weightQ6_K[20480 7168]
-
blk.48.attn_norm.weightF32[7168]
-
blk.48.ffn_norm.weightF32[7168]
-
blk.49.attn_q.weightQ5_K[7168 7168]
-
blk.49.attn_k.weightQ5_K[7168 1024]
-
blk.49.attn_v.weightQ5_K[7168 1024]
-
blk.49.attn_output.weightQ5_K[7168 7168]
-
blk.49.ffn_gate.weightQ5_K[7168 20480]
-
blk.49.ffn_up.weightQ5_K[7168 20480]
-
blk.49.ffn_down.weightQ5_K[20480 7168]
-
blk.49.attn_norm.weightF32[7168]
-
blk.49.ffn_norm.weightF32[7168]
-
blk.50.attn_q.weightQ5_K[7168 7168]
-
blk.50.attn_k.weightQ5_K[7168 1024]
-
blk.50.attn_v.weightQ5_K[7168 1024]
-
blk.50.attn_output.weightQ5_K[7168 7168]
-
blk.50.ffn_gate.weightQ5_K[7168 20480]
-
blk.50.ffn_up.weightQ5_K[7168 20480]
-
blk.50.ffn_down.weightQ5_K[20480 7168]
-
blk.50.attn_norm.weightF32[7168]
-
blk.50.ffn_norm.weightF32[7168]
-
blk.51.attn_q.weightQ5_K[7168 7168]
-
blk.51.attn_k.weightQ5_K[7168 1024]
-
blk.51.attn_v.weightQ6_K[7168 1024]
-
blk.51.attn_output.weightQ5_K[7168 7168]
-
blk.51.ffn_gate.weightQ5_K[7168 20480]
-
blk.51.ffn_up.weightQ5_K[7168 20480]
-
blk.51.ffn_down.weightQ6_K[20480 7168]
-
blk.51.attn_norm.weightF32[7168]
-
blk.51.ffn_norm.weightF32[7168]
-
blk.52.attn_q.weightQ5_K[7168 7168]
-
blk.52.attn_k.weightQ5_K[7168 1024]
-
blk.52.attn_v.weightQ6_K[7168 1024]
-
blk.52.attn_output.weightQ5_K[7168 7168]
-
blk.52.ffn_gate.weightQ5_K[7168 20480]
-
blk.52.ffn_up.weightQ5_K[7168 20480]
-
blk.52.ffn_down.weightQ6_K[20480 7168]
-
blk.52.attn_norm.weightF32[7168]
-
blk.52.ffn_norm.weightF32[7168]
-
blk.53.attn_q.weightQ5_K[7168 7168]
-
blk.53.attn_k.weightQ5_K[7168 1024]
-
blk.53.attn_v.weightQ6_K[7168 1024]
-
blk.53.attn_output.weightQ5_K[7168 7168]
-
blk.53.ffn_gate.weightQ5_K[7168 20480]
-
blk.53.ffn_up.weightQ5_K[7168 20480]
-
blk.53.ffn_down.weightQ6_K[20480 7168]
-
blk.53.attn_norm.weightF32[7168]
-
blk.53.ffn_norm.weightF32[7168]
-
blk.54.attn_q.weightQ5_K[7168 7168]
-
blk.54.attn_k.weightQ5_K[7168 1024]
-
blk.54.attn_v.weightQ6_K[7168 1024]
-
blk.54.attn_output.weightQ5_K[7168 7168]
-
blk.54.ffn_gate.weightQ5_K[7168 20480]
-
blk.54.ffn_up.weightQ5_K[7168 20480]
-
blk.54.ffn_down.weightQ6_K[20480 7168]
-
blk.54.attn_norm.weightF32[7168]
-
blk.54.ffn_norm.weightF32[7168]
-
blk.55.attn_q.weightQ5_K[7168 7168]
-
blk.55.attn_k.weightQ5_K[7168 1024]
-
blk.55.attn_v.weightQ6_K[7168 1024]
-
blk.55.attn_output.weightQ5_K[7168 7168]
-
blk.55.ffn_gate.weightQ5_K[7168 20480]
-
blk.55.ffn_up.weightQ5_K[7168 20480]
-
blk.55.ffn_down.weightQ6_K[20480 7168]
-
blk.55.attn_norm.weightF32[7168]
-
blk.55.ffn_norm.weightF32[7168]
-
blk.56.attn_q.weightQ5_K[7168 7168]
-
blk.56.attn_k.weightQ5_K[7168 1024]
-
blk.56.attn_v.weightQ6_K[7168 1024]
-
blk.56.attn_output.weightQ5_K[7168 7168]
-
blk.56.ffn_gate.weightQ5_K[7168 20480]
-
blk.56.ffn_up.weightQ5_K[7168 20480]
-
blk.56.ffn_down.weightQ6_K[20480 7168]
-
blk.56.attn_norm.weightF32[7168]
-
blk.56.ffn_norm.weightF32[7168]
-
blk.57.attn_q.weightQ5_K[7168 7168]
-
blk.57.attn_k.weightQ5_K[7168 1024]
-
blk.57.attn_v.weightQ6_K[7168 1024]
-
blk.57.attn_output.weightQ5_K[7168 7168]
-
blk.57.ffn_gate.weightQ5_K[7168 20480]
-
blk.57.ffn_up.weightQ5_K[7168 20480]
-
blk.57.ffn_down.weightQ6_K[20480 7168]
-
blk.57.attn_norm.weightF32[7168]
-
blk.57.ffn_norm.weightF32[7168]
-
blk.58.attn_q.weightQ5_K[7168 7168]
-
blk.58.attn_k.weightQ5_K[7168 1024]
-
blk.58.attn_v.weightQ6_K[7168 1024]
-
blk.58.attn_output.weightQ5_K[7168 7168]
-
blk.58.ffn_gate.weightQ5_K[7168 20480]
-
blk.58.ffn_up.weightQ5_K[7168 20480]
-
blk.58.ffn_down.weightQ6_K[20480 7168]
-
blk.58.attn_norm.weightF32[7168]
-
blk.58.ffn_norm.weightF32[7168]
-
blk.59.attn_q.weightQ5_K[7168 7168]
-
blk.59.attn_k.weightQ5_K[7168 1024]
-
blk.59.attn_v.weightQ6_K[7168 1024]
-
blk.59.attn_output.weightQ5_K[7168 7168]
-
blk.59.ffn_gate.weightQ5_K[7168 20480]
-
blk.59.ffn_up.weightQ5_K[7168 20480]
-
blk.59.ffn_down.weightQ6_K[20480 7168]
-
blk.59.attn_norm.weightF32[7168]
-
blk.59.ffn_norm.weightF32[7168]
-
output_norm.weightF32[7168]
-
output.weightQ6_K[7168 64000]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59