thanks to bartowski for quants on HF
140 Pulls Updated 5 months ago
e40c20df4eff · 7.5GB
-
general.architecturellama
-
general.file_type30
-
general.namedolphin-2.9.2-Phi-3-Medium
-
general.quantization_version2
-
llama.attention.head_count40
-
llama.attention.head_count_kv10
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count40
-
llama.context_length4096
-
llama.embedding_length5120
-
llama.feed_forward_length17920
-
llama.rope.dimension_count128
-
llama.rope.freq_base10000
-
llama.vocab_size32064
-
quantize.imatrix.chunks_count151
-
quantize.imatrix.dataset/training_data/calibration_datav3.txt
-
quantize.imatrix.entries_count280
-
quantize.imatrix.file/models/dolphin-2.9.2-Phi-3-Medium-GGUF/dolphin-2.9.2-Phi-3-Medium.imatrix
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32011
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32009
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[0, 0, 0, 0, 0, ...]
-
tokenizer.ggml.token_type[2, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[5120, 32064]
-
blk.0.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.0.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.0.attn_v.weightQ5_K[5120, 1280]
-
blk.0.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.1.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.1.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.1.attn_v.weightQ5_K[5120, 1280]
-
blk.1.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.2.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.2.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.2.attn_v.weightQ5_K[5120, 1280]
-
blk.2.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.3.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.3.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.3.attn_v.weightQ5_K[5120, 1280]
-
blk.3.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.4.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.4.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.4.attn_v.weightQ5_K[5120, 1280]
-
blk.4.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.5.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.5.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.5.attn_v.weightQ5_K[5120, 1280]
-
blk.5.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.6.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.6.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.6.attn_v.weightQ5_K[5120, 1280]
-
blk.6.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.7.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.7.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.7.attn_v.weightQ5_K[5120, 1280]
-
blk.7.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.8.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.8.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.8.attn_v.weightQ5_K[5120, 1280]
-
blk.8.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.9.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.9.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.9.attn_v.weightQ5_K[5120, 1280]
-
blk.9.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.10.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.10.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.10.attn_v.weightQ5_K[5120, 1280]
-
blk.10.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.11.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.11.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.11.attn_v.weightQ5_K[5120, 1280]
-
blk.11.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.12.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.12.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.12.attn_v.weightQ5_K[5120, 1280]
-
blk.12.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.13.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.13.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.13.attn_v.weightQ5_K[5120, 1280]
-
blk.13.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.14.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.14.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.14.attn_v.weightQ5_K[5120, 1280]
-
blk.14.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.15.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.15.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.15.attn_v.weightQ5_K[5120, 1280]
-
blk.15.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.16.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.16.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.16.attn_v.weightQ5_K[5120, 1280]
-
blk.16.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.17.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.17.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.17.attn_v.weightQ5_K[5120, 1280]
-
blk.17.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.18.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.18.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.18.attn_v.weightQ5_K[5120, 1280]
-
blk.18.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.19.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.19.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.19.attn_v.weightQ5_K[5120, 1280]
-
blk.19.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.20.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.20.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.20.attn_v.weightQ5_K[5120, 1280]
-
blk.20.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.21.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.21.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.21.attn_v.weightQ5_K[5120, 1280]
-
blk.21.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.22.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.22.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.22.attn_v.weightQ5_K[5120, 1280]
-
blk.22.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.23.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.23.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.23.attn_v.weightQ5_K[5120, 1280]
-
blk.23.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.24.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.24.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.24.attn_v.weightQ5_K[5120, 1280]
-
blk.24.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.25.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.25.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.25.attn_v.weightQ5_K[5120, 1280]
-
blk.25.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.26.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.26.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.26.attn_v.weightQ5_K[5120, 1280]
-
blk.26.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.27.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.27.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.27.attn_v.weightQ5_K[5120, 1280]
-
blk.27.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.28.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.28.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.28.attn_v.weightQ5_K[5120, 1280]
-
blk.28.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.29.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.29.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.29.attn_v.weightQ5_K[5120, 1280]
-
blk.29.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.30.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.30.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.30.attn_v.weightQ5_K[5120, 1280]
-
blk.30.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.31.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.31.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.31.attn_v.weightQ5_K[5120, 1280]
-
blk.31.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.32.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.32.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.32.attn_v.weightQ5_K[5120, 1280]
-
blk.32.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.33.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.33.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.33.attn_v.weightQ5_K[5120, 1280]
-
blk.33.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.34.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.34.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.34.attn_v.weightQ5_K[5120, 1280]
-
blk.34.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.35.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.35.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.35.attn_v.weightQ5_K[5120, 1280]
-
blk.35.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.36.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.36.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.36.attn_v.weightQ5_K[5120, 1280]
-
blk.36.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.37.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.37.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.37.attn_v.weightQ5_K[5120, 1280]
-
blk.37.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.38.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.38.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.38.attn_v.weightQ5_K[5120, 1280]
-
blk.38.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
blk.39.attn_k.weight(!unknown_type 23!)[5120, 1280]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.attn_output.weight(!unknown_type 23!)[5120, 5120]
-
blk.39.attn_q.weight(!unknown_type 23!)[5120, 5120]
-
blk.39.attn_v.weightQ5_K[5120, 1280]
-
blk.39.ffn_down.weight(!unknown_type 23!)[17920, 5120]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[5120, 17920]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.ffn_up.weight(!unknown_type 23!)[5120, 17920]
-
output.weightQ6_K[5120, 32064]
-
output_norm.weightF32[5120]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39