Polish LLM - Bielik-11B-v2.0-Instruct ~ by SpeakLeash a.k.a Spichlerz!
3 Pulls Updated 6 weeks ago
3de90ad3761a · 2.7GB
-
general.architecturellama
-
general.file_type31
-
general.nametekken
-
general.quantization_version2
-
general.size_label11B
-
general.typemodel
-
general.version2.0
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length8192
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ2_K[4096, 32128]
-
blk.0.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_output.weightI8[4096, 4096]
-
blk.0.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.0.attn_v.weightQ4_K[4096, 1024]
-
blk.0.ffn_down.weightQ2_K[14336, 4096]
-
blk.0.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.1.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_output.weightI8[4096, 4096]
-
blk.1.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.1.attn_v.weightQ4_K[4096, 1024]
-
blk.1.ffn_down.weightQ2_K[14336, 4096]
-
blk.1.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.2.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_output.weightI8[4096, 4096]
-
blk.2.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.2.attn_v.weightQ4_K[4096, 1024]
-
blk.2.ffn_down.weightQ2_K[14336, 4096]
-
blk.2.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.3.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_output.weightI8[4096, 4096]
-
blk.3.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.3.attn_v.weightQ4_K[4096, 1024]
-
blk.3.ffn_down.weightQ2_K[14336, 4096]
-
blk.3.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.4.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_output.weightI8[4096, 4096]
-
blk.4.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.4.attn_v.weightQ4_K[4096, 1024]
-
blk.4.ffn_down.weightQ2_K[14336, 4096]
-
blk.4.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.5.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_output.weightI8[4096, 4096]
-
blk.5.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.5.attn_v.weightQ4_K[4096, 1024]
-
blk.5.ffn_down.weightQ2_K[14336, 4096]
-
blk.5.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.6.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_output.weightI8[4096, 4096]
-
blk.6.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.6.attn_v.weightQ4_K[4096, 1024]
-
blk.6.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.6.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.7.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_output.weightI8[4096, 4096]
-
blk.7.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.7.attn_v.weightQ4_K[4096, 1024]
-
blk.7.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.7.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.8.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_output.weightI8[4096, 4096]
-
blk.8.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.8.attn_v.weightQ4_K[4096, 1024]
-
blk.8.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.8.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.9.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_output.weightI8[4096, 4096]
-
blk.9.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.9.attn_v.weightQ4_K[4096, 1024]
-
blk.9.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.9.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.10.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_output.weightI8[4096, 4096]
-
blk.10.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.10.attn_v.weightQ4_K[4096, 1024]
-
blk.10.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.10.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.11.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_output.weightI8[4096, 4096]
-
blk.11.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.11.attn_v.weightQ4_K[4096, 1024]
-
blk.11.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.11.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.12.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_output.weightI8[4096, 4096]
-
blk.12.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.12.attn_v.weightQ4_K[4096, 1024]
-
blk.12.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.12.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.13.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_output.weightI8[4096, 4096]
-
blk.13.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.13.attn_v.weightQ4_K[4096, 1024]
-
blk.13.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.13.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.14.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_output.weightI8[4096, 4096]
-
blk.14.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.14.attn_v.weightQ4_K[4096, 1024]
-
blk.14.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.14.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.15.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_output.weightI8[4096, 4096]
-
blk.15.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.15.attn_v.weightQ4_K[4096, 1024]
-
blk.15.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.15.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.16.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_output.weightI8[4096, 4096]
-
blk.16.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.16.attn_v.weightQ4_K[4096, 1024]
-
blk.16.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.16.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.17.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_output.weightI8[4096, 4096]
-
blk.17.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.17.attn_v.weightQ4_K[4096, 1024]
-
blk.17.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.17.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.18.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_output.weightI8[4096, 4096]
-
blk.18.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.18.attn_v.weightQ4_K[4096, 1024]
-
blk.18.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.18.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.19.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_output.weightI8[4096, 4096]
-
blk.19.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.19.attn_v.weightQ4_K[4096, 1024]
-
blk.19.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.19.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.20.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_output.weightI8[4096, 4096]
-
blk.20.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.20.attn_v.weightQ4_K[4096, 1024]
-
blk.20.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.20.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.21.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_output.weightI8[4096, 4096]
-
blk.21.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.21.attn_v.weightQ4_K[4096, 1024]
-
blk.21.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.21.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.22.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_output.weightI8[4096, 4096]
-
blk.22.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.22.attn_v.weightQ4_K[4096, 1024]
-
blk.22.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.22.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.23.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_output.weightI8[4096, 4096]
-
blk.23.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.23.attn_v.weightQ4_K[4096, 1024]
-
blk.23.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.23.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.24.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_output.weightI8[4096, 4096]
-
blk.24.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.24.attn_v.weightQ4_K[4096, 1024]
-
blk.24.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.24.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.25.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_output.weightI8[4096, 4096]
-
blk.25.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.25.attn_v.weightQ4_K[4096, 1024]
-
blk.25.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.25.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.26.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_output.weightI8[4096, 4096]
-
blk.26.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.26.attn_v.weightQ4_K[4096, 1024]
-
blk.26.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.26.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.27.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_output.weightI8[4096, 4096]
-
blk.27.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.27.attn_v.weightQ4_K[4096, 1024]
-
blk.27.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.27.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.28.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_output.weightI8[4096, 4096]
-
blk.28.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.28.attn_v.weightQ4_K[4096, 1024]
-
blk.28.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.28.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.29.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_output.weightI8[4096, 4096]
-
blk.29.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.29.attn_v.weightQ4_K[4096, 1024]
-
blk.29.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.29.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.30.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_output.weightI8[4096, 4096]
-
blk.30.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.30.attn_v.weightQ4_K[4096, 1024]
-
blk.30.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.30.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.31.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_output.weightI8[4096, 4096]
-
blk.31.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.31.attn_v.weightQ4_K[4096, 1024]
-
blk.31.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.31.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.32.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_output.weightI8[4096, 4096]
-
blk.32.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.32.attn_v.weightQ4_K[4096, 1024]
-
blk.32.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.32.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.33.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_output.weightI8[4096, 4096]
-
blk.33.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.33.attn_v.weightQ4_K[4096, 1024]
-
blk.33.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.33.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.34.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_output.weightI8[4096, 4096]
-
blk.34.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.34.attn_v.weightQ4_K[4096, 1024]
-
blk.34.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.34.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.35.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_output.weightI8[4096, 4096]
-
blk.35.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.35.attn_v.weightQ4_K[4096, 1024]
-
blk.35.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.35.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.36.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_output.weightI8[4096, 4096]
-
blk.36.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.36.attn_v.weightQ4_K[4096, 1024]
-
blk.36.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.36.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.37.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_output.weightI8[4096, 4096]
-
blk.37.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.37.attn_v.weightQ4_K[4096, 1024]
-
blk.37.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.37.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.38.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_output.weightI8[4096, 4096]
-
blk.38.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.38.attn_v.weightQ4_K[4096, 1024]
-
blk.38.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.38.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.39.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_output.weightI8[4096, 4096]
-
blk.39.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.39.attn_v.weightQ4_K[4096, 1024]
-
blk.39.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.39.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.40.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_output.weightI8[4096, 4096]
-
blk.40.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.40.attn_v.weightQ4_K[4096, 1024]
-
blk.40.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.40.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.41.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_output.weightI8[4096, 4096]
-
blk.41.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.41.attn_v.weightQ4_K[4096, 1024]
-
blk.41.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.41.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.42.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.attn_output.weightI8[4096, 4096]
-
blk.42.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.42.attn_v.weightQ4_K[4096, 1024]
-
blk.42.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.42.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.43.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.attn_output.weightI8[4096, 4096]
-
blk.43.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.43.attn_v.weightQ4_K[4096, 1024]
-
blk.43.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.43.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.44.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.attn_output.weightI8[4096, 4096]
-
blk.44.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.44.attn_v.weightQ4_K[4096, 1024]
-
blk.44.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.44.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.45.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.attn_output.weightI8[4096, 4096]
-
blk.45.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.45.attn_v.weightQ4_K[4096, 1024]
-
blk.45.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.45.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.46.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.attn_output.weightI8[4096, 4096]
-
blk.46.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.46.attn_v.weightQ4_K[4096, 1024]
-
blk.46.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.46.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.47.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.attn_output.weightI8[4096, 4096]
-
blk.47.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.47.attn_v.weightQ4_K[4096, 1024]
-
blk.47.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.47.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.48.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.attn_output.weightI8[4096, 4096]
-
blk.48.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.48.attn_v.weightQ4_K[4096, 1024]
-
blk.48.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.48.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.49.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.attn_output.weightI8[4096, 4096]
-
blk.49.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.49.attn_v.weightQ4_K[4096, 1024]
-
blk.49.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.49.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
output.weightQ5_K[4096, 32128]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49