InternLM2.5 has open-sourced a 20 billion parameter base model and a chat model tailored for practical scenarios.
281 Pulls Updated 3 months ago
4cc7a14a972d · 7.8GB
-
general.architectureinternlm2
-
general.file_type23
-
general.finetune..
-
general.licenseother
-
general.name..
-
general.quantization_version2
-
general.size_label20B
-
general.tags[text-generation]
-
general.typemodel
-
internlm2.attention.head_count48
-
internlm2.attention.head_count_kv8
-
internlm2.attention.layer_norm_rms_epsilon1e-05
-
internlm2.block_count48
-
internlm2.context_length32768
-
internlm2.embedding_length6144
-
internlm2.feed_forward_length16384
-
internlm2.rope.freq_base5e+07
-
quantize.imatrix.chunks_count136
-
quantize.imatrix.dataset/shared/opt/work_models/_imatrix/calibration_datav3.txt
-
quantize.imatrix.entries_count336
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id92542
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
NameTypeShape
-
token_embd.weight(!unknown_type 21!)[6144, 92544]
-
blk.0.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.0.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.0.attn_v.weightQ4_K[6144, 1024]
-
blk.0.ffn_down.weightI32[16384, 6144]
-
blk.0.ffn_gate.weightI32[6144, 16384]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.ffn_up.weightI32[6144, 16384]
-
blk.1.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.1.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.1.attn_v.weightQ4_K[6144, 1024]
-
blk.1.ffn_down.weightI32[16384, 6144]
-
blk.1.ffn_gate.weightI32[6144, 16384]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.ffn_up.weightI32[6144, 16384]
-
blk.2.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.2.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.2.attn_v.weightQ4_K[6144, 1024]
-
blk.2.ffn_down.weightI32[16384, 6144]
-
blk.2.ffn_gate.weightI32[6144, 16384]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.ffn_up.weightI32[6144, 16384]
-
blk.3.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.3.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.3.attn_v.weightQ4_K[6144, 1024]
-
blk.3.ffn_down.weightI32[16384, 6144]
-
blk.3.ffn_gate.weightI32[6144, 16384]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.ffn_up.weightI32[6144, 16384]
-
blk.4.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.4.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.4.attn_v.weightQ4_K[6144, 1024]
-
blk.4.ffn_down.weightI32[16384, 6144]
-
blk.4.ffn_gate.weightI32[6144, 16384]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.ffn_up.weightI32[6144, 16384]
-
blk.5.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.5.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.5.attn_v.weightQ4_K[6144, 1024]
-
blk.5.ffn_down.weightI32[16384, 6144]
-
blk.5.ffn_gate.weightI32[6144, 16384]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.5.ffn_up.weightI32[6144, 16384]
-
blk.6.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.6.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.6.attn_v.weightQ4_K[6144, 1024]
-
blk.6.ffn_down.weightI32[16384, 6144]
-
blk.6.ffn_gate.weightI32[6144, 16384]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.ffn_up.weightI32[6144, 16384]
-
blk.7.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.7.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.7.attn_v.weightQ4_K[6144, 1024]
-
blk.7.ffn_down.weightI32[16384, 6144]
-
blk.7.ffn_gate.weightI32[6144, 16384]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.ffn_up.weightI32[6144, 16384]
-
blk.8.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.8.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.8.attn_v.weightQ4_K[6144, 1024]
-
blk.8.ffn_down.weightI32[16384, 6144]
-
blk.8.ffn_gate.weightI32[6144, 16384]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.ffn_up.weightI32[6144, 16384]
-
blk.9.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.9.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.9.attn_v.weightQ4_K[6144, 1024]
-
blk.9.ffn_down.weightI32[16384, 6144]
-
blk.9.ffn_gate.weightI32[6144, 16384]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.ffn_up.weightI32[6144, 16384]
-
blk.10.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.10.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.10.attn_v.weightQ4_K[6144, 1024]
-
blk.10.ffn_down.weightI32[16384, 6144]
-
blk.10.ffn_gate.weightI32[6144, 16384]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.ffn_up.weightI32[6144, 16384]
-
blk.11.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.11.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.11.attn_v.weightQ4_K[6144, 1024]
-
blk.11.ffn_down.weightI32[16384, 6144]
-
blk.11.ffn_gate.weightI32[6144, 16384]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.ffn_up.weightI32[6144, 16384]
-
blk.12.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.12.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.12.attn_v.weightQ4_K[6144, 1024]
-
blk.12.ffn_down.weightI32[16384, 6144]
-
blk.12.ffn_gate.weightI32[6144, 16384]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.ffn_up.weightI32[6144, 16384]
-
blk.13.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.13.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.13.attn_v.weightQ4_K[6144, 1024]
-
blk.13.ffn_down.weightI32[16384, 6144]
-
blk.13.ffn_gate.weightI32[6144, 16384]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.ffn_up.weightI32[6144, 16384]
-
blk.14.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.14.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.14.attn_v.weightQ4_K[6144, 1024]
-
blk.14.ffn_down.weightI32[16384, 6144]
-
blk.14.ffn_gate.weightI32[6144, 16384]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.ffn_up.weightI32[6144, 16384]
-
blk.15.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.15.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.15.attn_v.weightQ4_K[6144, 1024]
-
blk.15.ffn_down.weightI32[16384, 6144]
-
blk.15.ffn_gate.weightI32[6144, 16384]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.ffn_up.weightI32[6144, 16384]
-
blk.16.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.16.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.16.attn_v.weightQ4_K[6144, 1024]
-
blk.16.ffn_down.weightI32[16384, 6144]
-
blk.16.ffn_gate.weightI32[6144, 16384]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.ffn_up.weightI32[6144, 16384]
-
blk.17.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.17.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.17.attn_v.weightQ4_K[6144, 1024]
-
blk.17.ffn_down.weightI32[16384, 6144]
-
blk.17.ffn_gate.weightI32[6144, 16384]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.ffn_up.weightI32[6144, 16384]
-
blk.18.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.18.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.18.attn_v.weightQ4_K[6144, 1024]
-
blk.18.ffn_down.weightI32[16384, 6144]
-
blk.18.ffn_gate.weightI32[6144, 16384]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.18.ffn_up.weightI32[6144, 16384]
-
blk.19.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.19.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.19.attn_v.weightQ4_K[6144, 1024]
-
blk.19.ffn_down.weightI32[16384, 6144]
-
blk.19.ffn_gate.weightI32[6144, 16384]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.ffn_up.weightI32[6144, 16384]
-
blk.20.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.20.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.20.attn_v.weightQ4_K[6144, 1024]
-
blk.20.ffn_down.weightI32[16384, 6144]
-
blk.20.ffn_gate.weightI32[6144, 16384]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.ffn_up.weightI32[6144, 16384]
-
blk.21.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.21.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.21.attn_v.weightQ4_K[6144, 1024]
-
blk.21.ffn_down.weightI32[16384, 6144]
-
blk.21.ffn_gate.weightI32[6144, 16384]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.ffn_up.weightI32[6144, 16384]
-
blk.22.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.22.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.22.attn_v.weightQ4_K[6144, 1024]
-
blk.22.ffn_down.weightI32[16384, 6144]
-
blk.22.ffn_gate.weightI32[6144, 16384]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.ffn_up.weightI32[6144, 16384]
-
blk.23.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.23.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.23.attn_v.weightQ4_K[6144, 1024]
-
blk.23.ffn_down.weightI32[16384, 6144]
-
blk.23.ffn_gate.weightI32[6144, 16384]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.ffn_up.weightI32[6144, 16384]
-
blk.24.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.24.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.24.attn_v.weightQ4_K[6144, 1024]
-
blk.24.ffn_down.weightI32[16384, 6144]
-
blk.24.ffn_gate.weightI32[6144, 16384]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.24.ffn_up.weightI32[6144, 16384]
-
blk.25.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.25.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.25.attn_v.weightQ4_K[6144, 1024]
-
blk.25.ffn_down.weightI32[16384, 6144]
-
blk.25.ffn_gate.weightI32[6144, 16384]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.ffn_up.weightI32[6144, 16384]
-
blk.26.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.26.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.26.attn_v.weightQ4_K[6144, 1024]
-
blk.26.ffn_down.weightI32[16384, 6144]
-
blk.26.ffn_gate.weightI32[6144, 16384]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.ffn_up.weightI32[6144, 16384]
-
blk.27.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.27.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.27.attn_v.weightQ4_K[6144, 1024]
-
blk.27.ffn_down.weightI32[16384, 6144]
-
blk.27.ffn_gate.weightI32[6144, 16384]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.ffn_up.weightI32[6144, 16384]
-
blk.28.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.28.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.28.attn_v.weightQ4_K[6144, 1024]
-
blk.28.ffn_down.weightI32[16384, 6144]
-
blk.28.ffn_gate.weightI32[6144, 16384]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.ffn_up.weightI32[6144, 16384]
-
blk.29.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.29.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.29.attn_v.weightQ4_K[6144, 1024]
-
blk.29.ffn_down.weightI32[16384, 6144]
-
blk.29.ffn_gate.weightI32[6144, 16384]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.ffn_up.weightI32[6144, 16384]
-
blk.30.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.30.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.30.attn_v.weightQ4_K[6144, 1024]
-
blk.30.ffn_down.weightI32[16384, 6144]
-
blk.30.ffn_gate.weightI32[6144, 16384]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.ffn_up.weightI32[6144, 16384]
-
blk.31.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.31.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.31.attn_v.weightQ4_K[6144, 1024]
-
blk.31.ffn_down.weightI32[16384, 6144]
-
blk.31.ffn_gate.weightI32[6144, 16384]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.31.ffn_up.weightI32[6144, 16384]
-
blk.32.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.32.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.32.attn_v.weightQ4_K[6144, 1024]
-
blk.32.ffn_down.weightI32[16384, 6144]
-
blk.32.ffn_gate.weightI32[6144, 16384]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.ffn_up.weightI32[6144, 16384]
-
blk.33.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.33.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.33.attn_v.weightQ4_K[6144, 1024]
-
blk.33.ffn_down.weightI32[16384, 6144]
-
blk.33.ffn_gate.weightI32[6144, 16384]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.ffn_up.weightI32[6144, 16384]
-
blk.34.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.34.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.34.attn_v.weightQ4_K[6144, 1024]
-
blk.34.ffn_down.weightI32[16384, 6144]
-
blk.34.ffn_gate.weightI32[6144, 16384]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.ffn_up.weightI32[6144, 16384]
-
blk.35.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.35.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.35.attn_v.weightQ4_K[6144, 1024]
-
blk.35.ffn_down.weightI32[16384, 6144]
-
blk.35.ffn_gate.weightI32[6144, 16384]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.ffn_up.weightI32[6144, 16384]
-
blk.36.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.36.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.36.attn_v.weightQ4_K[6144, 1024]
-
blk.36.ffn_down.weightI32[16384, 6144]
-
blk.36.ffn_gate.weightI32[6144, 16384]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.ffn_up.weightI32[6144, 16384]
-
blk.37.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.37.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.37.attn_v.weightQ4_K[6144, 1024]
-
blk.37.ffn_down.weightI32[16384, 6144]
-
blk.37.ffn_gate.weightI32[6144, 16384]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.37.ffn_up.weightI32[6144, 16384]
-
blk.38.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.38.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.38.attn_v.weightQ4_K[6144, 1024]
-
blk.38.ffn_down.weightI32[16384, 6144]
-
blk.38.ffn_gate.weightI32[6144, 16384]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.ffn_up.weightI32[6144, 16384]
-
blk.39.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.39.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.39.attn_v.weightQ4_K[6144, 1024]
-
blk.39.ffn_down.weightI32[16384, 6144]
-
blk.39.ffn_gate.weightI32[6144, 16384]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.ffn_up.weightI32[6144, 16384]
-
blk.40.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.40.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.40.attn_v.weightQ4_K[6144, 1024]
-
blk.40.ffn_down.weightI32[16384, 6144]
-
blk.40.ffn_gate.weightI32[6144, 16384]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.40.ffn_up.weightI32[6144, 16384]
-
blk.41.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.41.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.41.attn_v.weightQ4_K[6144, 1024]
-
blk.41.ffn_down.weightI32[16384, 6144]
-
blk.41.ffn_gate.weightI32[6144, 16384]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.41.ffn_up.weightI32[6144, 16384]
-
blk.42.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.42.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.42.attn_v.weightQ4_K[6144, 1024]
-
blk.42.ffn_down.weightI32[16384, 6144]
-
blk.42.ffn_gate.weightI32[6144, 16384]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.42.ffn_up.weightI32[6144, 16384]
-
blk.43.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.43.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.43.attn_v.weightQ4_K[6144, 1024]
-
blk.43.ffn_down.weightI32[16384, 6144]
-
blk.43.ffn_gate.weightI32[6144, 16384]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.43.ffn_up.weightI32[6144, 16384]
-
blk.44.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.44.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.44.attn_v.weightQ4_K[6144, 1024]
-
blk.44.ffn_down.weightI32[16384, 6144]
-
blk.44.ffn_gate.weightI32[6144, 16384]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.44.ffn_up.weightI32[6144, 16384]
-
blk.45.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.45.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.45.attn_v.weightQ4_K[6144, 1024]
-
blk.45.ffn_down.weightI32[16384, 6144]
-
blk.45.ffn_gate.weightI32[6144, 16384]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.45.ffn_up.weightI32[6144, 16384]
-
blk.46.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.46.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.46.attn_v.weightQ4_K[6144, 1024]
-
blk.46.ffn_down.weightI32[16384, 6144]
-
blk.46.ffn_gate.weightI32[6144, 16384]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.46.ffn_up.weightI32[6144, 16384]
-
blk.47.attn_k.weight(!unknown_type 22!)[6144, 1024]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.attn_output.weight(!unknown_type 21!)[6144, 6144]
-
blk.47.attn_q.weight(!unknown_type 22!)[6144, 6144]
-
blk.47.attn_v.weightQ4_K[6144, 1024]
-
blk.47.ffn_down.weightI32[16384, 6144]
-
blk.47.ffn_gate.weightI32[6144, 16384]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.47.ffn_up.weightI32[6144, 16384]
-
output.weightQ5_K[6144, 92544]
-
output_norm.weightF32[6144]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47