InternLM2.5 has open-sourced a 20 billion parameter base model and a chat model tailored for practical scenarios.
281 Pulls Updated 3 months ago
52a0cf7285dd · 11GB
-
general.architectureinternlm2
-
general.file_type30
-
general.finetune..
-
general.licenseother
-
general.name..
-
general.quantization_version2
-
general.size_label20B
-
general.tags[text-generation]
-
general.typemodel
-
internlm2.attention.head_count48
-
internlm2.attention.head_count_kv8
-
internlm2.attention.layer_norm_rms_epsilon1e-05
-
internlm2.block_count48
-
internlm2.context_length32768
-
internlm2.embedding_length6144
-
internlm2.feed_forward_length16384
-
internlm2.rope.freq_base5e+07
-
quantize.imatrix.chunks_count136
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count336
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id92542
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 23!)[6144, 92544]
-
blk.0.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.0.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.0.attn_v.weightQ5_K[6144, 1024]
-
blk.0.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.0.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.1.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.1.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.1.attn_v.weightQ5_K[6144, 1024]
-
blk.1.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.1.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.2.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.2.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.2.attn_v.weightQ5_K[6144, 1024]
-
blk.2.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.2.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.3.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.3.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.3.attn_v.weightQ5_K[6144, 1024]
-
blk.3.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.3.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.4.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.4.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.4.attn_v.weightQ5_K[6144, 1024]
-
blk.4.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.4.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.5.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.5.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.5.attn_v.weightQ5_K[6144, 1024]
-
blk.5.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.5.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.5.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.6.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.6.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.6.attn_v.weightQ5_K[6144, 1024]
-
blk.6.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.6.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.7.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.7.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.7.attn_v.weightQ5_K[6144, 1024]
-
blk.7.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.7.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.8.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.8.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.8.attn_v.weightQ5_K[6144, 1024]
-
blk.8.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.8.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.9.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.9.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.9.attn_v.weightQ5_K[6144, 1024]
-
blk.9.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.9.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.10.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.10.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.10.attn_v.weightQ5_K[6144, 1024]
-
blk.10.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.10.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.11.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.11.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.11.attn_v.weightQ5_K[6144, 1024]
-
blk.11.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.11.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.12.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.12.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.12.attn_v.weightQ5_K[6144, 1024]
-
blk.12.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.12.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.13.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.13.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.13.attn_v.weightQ5_K[6144, 1024]
-
blk.13.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.13.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.14.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.14.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.14.attn_v.weightQ5_K[6144, 1024]
-
blk.14.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.14.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.15.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.15.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.15.attn_v.weightQ5_K[6144, 1024]
-
blk.15.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.15.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.16.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.16.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.16.attn_v.weightQ5_K[6144, 1024]
-
blk.16.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.16.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.17.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.17.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.17.attn_v.weightQ5_K[6144, 1024]
-
blk.17.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.17.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.18.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.18.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.18.attn_v.weightQ5_K[6144, 1024]
-
blk.18.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.18.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.18.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.19.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.19.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.19.attn_v.weightQ5_K[6144, 1024]
-
blk.19.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.19.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.20.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.20.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.20.attn_v.weightQ5_K[6144, 1024]
-
blk.20.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.20.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.21.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.21.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.21.attn_v.weightQ5_K[6144, 1024]
-
blk.21.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.21.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.22.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.22.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.22.attn_v.weightQ5_K[6144, 1024]
-
blk.22.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.22.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.23.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.23.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.23.attn_v.weightQ5_K[6144, 1024]
-
blk.23.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.23.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.24.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.24.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.24.attn_v.weightQ5_K[6144, 1024]
-
blk.24.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.24.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.24.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.25.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.25.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.25.attn_v.weightQ5_K[6144, 1024]
-
blk.25.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.25.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.26.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.26.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.26.attn_v.weightQ5_K[6144, 1024]
-
blk.26.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.26.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.27.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.27.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.27.attn_v.weightQ5_K[6144, 1024]
-
blk.27.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.27.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.28.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.28.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.28.attn_v.weightQ5_K[6144, 1024]
-
blk.28.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.28.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.29.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.29.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.29.attn_v.weightQ5_K[6144, 1024]
-
blk.29.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.29.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.30.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.30.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.30.attn_v.weightQ5_K[6144, 1024]
-
blk.30.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.30.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.31.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.31.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.31.attn_v.weightQ5_K[6144, 1024]
-
blk.31.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.31.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.31.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.32.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.32.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.32.attn_v.weightQ5_K[6144, 1024]
-
blk.32.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.32.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.33.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.33.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.33.attn_v.weightQ5_K[6144, 1024]
-
blk.33.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.33.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.34.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.34.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.34.attn_v.weightQ5_K[6144, 1024]
-
blk.34.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.34.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.35.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.35.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.35.attn_v.weightQ5_K[6144, 1024]
-
blk.35.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.35.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.36.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.36.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.36.attn_v.weightQ5_K[6144, 1024]
-
blk.36.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.36.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.37.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.37.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.37.attn_v.weightQ5_K[6144, 1024]
-
blk.37.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.37.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.37.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.38.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.38.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.38.attn_v.weightQ5_K[6144, 1024]
-
blk.38.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.38.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.39.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.39.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.39.attn_v.weightQ5_K[6144, 1024]
-
blk.39.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.39.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.40.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.40.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.40.attn_v.weightQ5_K[6144, 1024]
-
blk.40.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.40.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.40.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.41.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.41.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.41.attn_v.weightQ5_K[6144, 1024]
-
blk.41.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.41.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.41.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.42.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.42.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.42.attn_v.weightQ5_K[6144, 1024]
-
blk.42.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.42.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.42.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.43.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.43.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.43.attn_v.weightQ5_K[6144, 1024]
-
blk.43.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.43.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.43.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.44.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.44.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.44.attn_v.weightQ5_K[6144, 1024]
-
blk.44.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.44.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.44.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.45.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.45.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.45.attn_v.weightQ5_K[6144, 1024]
-
blk.45.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.45.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.45.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.46.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.46.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.46.attn_v.weightQ5_K[6144, 1024]
-
blk.46.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.46.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.46.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
blk.47.attn_k.weight(!unknown_type 23!)[6144, 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.attn_output.weight(!unknown_type 23!)[6144, 6144]
-
blk.47.attn_q.weight(!unknown_type 23!)[6144, 6144]
-
blk.47.attn_v.weightQ5_K[6144, 1024]
-
blk.47.ffn_down.weight(!unknown_type 23!)[16384, 6144]
-
blk.47.ffn_gate.weight(!unknown_type 23!)[6144, 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.47.ffn_up.weight(!unknown_type 23!)[6144, 16384]
-
output.weightQ6_K[6144, 92544]
-
output_norm.weightF32[6144]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47