Polish LLM - Bielik-11B-v2.2-Instruct ~ by SpeakLeash a.k.a Spichlerz!
140 Pulls Updated 2 months ago
eb114bf96e58 · 2.7GB
-
general.architecturellama
-
general.basenamedpo7
-
general.file_type31
-
general.finetune007.3k
-
general.nametekken
-
general.quantization_version2
-
general.size_label11B
-
general.typemodel
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count50
-
llama.context_length32768
-
llama.embedding_length4096
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size32128
-
quantize.imatrix.chunks_count9208
-
quantize.imatrix.datasetdata/dataset_raw.txt
-
quantize.imatrix.entries_count350
-
quantize.imatrix.fileimatrix.dat
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixtrue
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32001
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id2
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000, -1000, -1000, 0, 0, ...]
-
tokenizer.ggml.token_type[3, 3, 3, 6, 6, ...]
-
tokenizer.ggml.tokens[<unk>, <s>, </s>, <0x00>, <0x01>, ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ2_K[4096, 32128]
-
blk.0.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.attn_output.weightI8[4096, 4096]
-
blk.0.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.0.attn_v.weightQ4_K[4096, 1024]
-
blk.0.ffn_down.weightQ2_K[14336, 4096]
-
blk.0.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.1.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.attn_output.weightI8[4096, 4096]
-
blk.1.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.1.attn_v.weightQ4_K[4096, 1024]
-
blk.1.ffn_down.weightQ2_K[14336, 4096]
-
blk.1.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.2.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.attn_output.weightI8[4096, 4096]
-
blk.2.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.2.attn_v.weightQ4_K[4096, 1024]
-
blk.2.ffn_down.weightQ2_K[14336, 4096]
-
blk.2.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.3.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.attn_output.weightI8[4096, 4096]
-
blk.3.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.3.attn_v.weightQ4_K[4096, 1024]
-
blk.3.ffn_down.weightQ2_K[14336, 4096]
-
blk.3.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.4.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.attn_output.weightI8[4096, 4096]
-
blk.4.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.4.attn_v.weightQ4_K[4096, 1024]
-
blk.4.ffn_down.weightQ2_K[14336, 4096]
-
blk.4.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.5.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.attn_output.weightI8[4096, 4096]
-
blk.5.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.5.attn_v.weightQ4_K[4096, 1024]
-
blk.5.ffn_down.weightQ2_K[14336, 4096]
-
blk.5.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.6.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.attn_output.weightI8[4096, 4096]
-
blk.6.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.6.attn_v.weightQ4_K[4096, 1024]
-
blk.6.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.6.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.7.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.attn_output.weightI8[4096, 4096]
-
blk.7.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.7.attn_v.weightQ4_K[4096, 1024]
-
blk.7.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.7.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.8.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.attn_output.weightI8[4096, 4096]
-
blk.8.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.8.attn_v.weightQ4_K[4096, 1024]
-
blk.8.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.8.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.9.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.attn_output.weightI8[4096, 4096]
-
blk.9.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.9.attn_v.weightQ4_K[4096, 1024]
-
blk.9.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.9.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.10.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.attn_output.weightI8[4096, 4096]
-
blk.10.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.10.attn_v.weightQ4_K[4096, 1024]
-
blk.10.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.10.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.11.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.attn_output.weightI8[4096, 4096]
-
blk.11.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.11.attn_v.weightQ4_K[4096, 1024]
-
blk.11.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.11.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.11.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.12.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.attn_output.weightI8[4096, 4096]
-
blk.12.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.12.attn_v.weightQ4_K[4096, 1024]
-
blk.12.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.12.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.13.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.attn_output.weightI8[4096, 4096]
-
blk.13.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.13.attn_v.weightQ4_K[4096, 1024]
-
blk.13.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.13.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.14.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.attn_output.weightI8[4096, 4096]
-
blk.14.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.14.attn_v.weightQ4_K[4096, 1024]
-
blk.14.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.14.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.15.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.attn_output.weightI8[4096, 4096]
-
blk.15.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.15.attn_v.weightQ4_K[4096, 1024]
-
blk.15.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.15.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.16.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.attn_output.weightI8[4096, 4096]
-
blk.16.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.16.attn_v.weightQ4_K[4096, 1024]
-
blk.16.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.16.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.17.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.attn_output.weightI8[4096, 4096]
-
blk.17.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.17.attn_v.weightQ4_K[4096, 1024]
-
blk.17.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.17.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.18.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.attn_output.weightI8[4096, 4096]
-
blk.18.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.18.attn_v.weightQ4_K[4096, 1024]
-
blk.18.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.18.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.19.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.attn_output.weightI8[4096, 4096]
-
blk.19.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.19.attn_v.weightQ4_K[4096, 1024]
-
blk.19.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.19.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.20.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.attn_output.weightI8[4096, 4096]
-
blk.20.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.20.attn_v.weightQ4_K[4096, 1024]
-
blk.20.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.20.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.21.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.attn_output.weightI8[4096, 4096]
-
blk.21.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.21.attn_v.weightQ4_K[4096, 1024]
-
blk.21.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.21.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.22.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.attn_output.weightI8[4096, 4096]
-
blk.22.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.22.attn_v.weightQ4_K[4096, 1024]
-
blk.22.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.22.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.23.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.attn_output.weightI8[4096, 4096]
-
blk.23.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.23.attn_v.weightQ4_K[4096, 1024]
-
blk.23.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.23.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.23.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.24.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.attn_output.weightI8[4096, 4096]
-
blk.24.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.24.attn_v.weightQ4_K[4096, 1024]
-
blk.24.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.24.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.25.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.attn_output.weightI8[4096, 4096]
-
blk.25.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.25.attn_v.weightQ4_K[4096, 1024]
-
blk.25.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.25.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.26.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.attn_output.weightI8[4096, 4096]
-
blk.26.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.26.attn_v.weightQ4_K[4096, 1024]
-
blk.26.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.26.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.27.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.attn_output.weightI8[4096, 4096]
-
blk.27.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.27.attn_v.weightQ4_K[4096, 1024]
-
blk.27.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.27.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.28.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.attn_output.weightI8[4096, 4096]
-
blk.28.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.28.attn_v.weightQ4_K[4096, 1024]
-
blk.28.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.28.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.29.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.attn_output.weightI8[4096, 4096]
-
blk.29.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.29.attn_v.weightQ4_K[4096, 1024]
-
blk.29.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.29.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.30.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.attn_output.weightI8[4096, 4096]
-
blk.30.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.30.attn_v.weightQ4_K[4096, 1024]
-
blk.30.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.30.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.31.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.attn_output.weightI8[4096, 4096]
-
blk.31.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.31.attn_v.weightQ4_K[4096, 1024]
-
blk.31.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.31.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.32.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.32.attn_norm.weightF32[4096]
-
blk.32.attn_output.weightI8[4096, 4096]
-
blk.32.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.32.attn_v.weightQ4_K[4096, 1024]
-
blk.32.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.32.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.32.ffn_norm.weightF32[4096]
-
blk.32.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.33.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.33.attn_norm.weightF32[4096]
-
blk.33.attn_output.weightI8[4096, 4096]
-
blk.33.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.33.attn_v.weightQ4_K[4096, 1024]
-
blk.33.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.33.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.33.ffn_norm.weightF32[4096]
-
blk.33.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.34.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.34.attn_norm.weightF32[4096]
-
blk.34.attn_output.weightI8[4096, 4096]
-
blk.34.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.34.attn_v.weightQ4_K[4096, 1024]
-
blk.34.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.34.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.34.ffn_norm.weightF32[4096]
-
blk.34.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.35.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.35.attn_norm.weightF32[4096]
-
blk.35.attn_output.weightI8[4096, 4096]
-
blk.35.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.35.attn_v.weightQ4_K[4096, 1024]
-
blk.35.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.35.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.35.ffn_norm.weightF32[4096]
-
blk.35.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.36.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.36.attn_norm.weightF32[4096]
-
blk.36.attn_output.weightI8[4096, 4096]
-
blk.36.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.36.attn_v.weightQ4_K[4096, 1024]
-
blk.36.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.36.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.36.ffn_norm.weightF32[4096]
-
blk.36.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.37.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.37.attn_norm.weightF32[4096]
-
blk.37.attn_output.weightI8[4096, 4096]
-
blk.37.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.37.attn_v.weightQ4_K[4096, 1024]
-
blk.37.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.37.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.37.ffn_norm.weightF32[4096]
-
blk.37.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.38.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.38.attn_norm.weightF32[4096]
-
blk.38.attn_output.weightI8[4096, 4096]
-
blk.38.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.38.attn_v.weightQ4_K[4096, 1024]
-
blk.38.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.38.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.38.ffn_norm.weightF32[4096]
-
blk.38.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.39.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.39.attn_norm.weightF32[4096]
-
blk.39.attn_output.weightI8[4096, 4096]
-
blk.39.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.39.attn_v.weightQ4_K[4096, 1024]
-
blk.39.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.39.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.39.ffn_norm.weightF32[4096]
-
blk.39.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.40.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.40.attn_norm.weightF32[4096]
-
blk.40.attn_output.weightI8[4096, 4096]
-
blk.40.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.40.attn_v.weightQ4_K[4096, 1024]
-
blk.40.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.40.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.40.ffn_norm.weightF32[4096]
-
blk.40.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.41.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.41.attn_norm.weightF32[4096]
-
blk.41.attn_output.weightI8[4096, 4096]
-
blk.41.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.41.attn_v.weightQ4_K[4096, 1024]
-
blk.41.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.41.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.41.ffn_norm.weightF32[4096]
-
blk.41.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.42.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.42.attn_norm.weightF32[4096]
-
blk.42.attn_output.weightI8[4096, 4096]
-
blk.42.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.42.attn_v.weightQ4_K[4096, 1024]
-
blk.42.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.42.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.42.ffn_norm.weightF32[4096]
-
blk.42.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.43.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.43.attn_norm.weightF32[4096]
-
blk.43.attn_output.weightI8[4096, 4096]
-
blk.43.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.43.attn_v.weightQ4_K[4096, 1024]
-
blk.43.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.43.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.43.ffn_norm.weightF32[4096]
-
blk.43.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.44.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.44.attn_norm.weightF32[4096]
-
blk.44.attn_output.weightI8[4096, 4096]
-
blk.44.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.44.attn_v.weightQ4_K[4096, 1024]
-
blk.44.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.44.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.44.ffn_norm.weightF32[4096]
-
blk.44.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.45.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.45.attn_norm.weightF32[4096]
-
blk.45.attn_output.weightI8[4096, 4096]
-
blk.45.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.45.attn_v.weightQ4_K[4096, 1024]
-
blk.45.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.45.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.45.ffn_norm.weightF32[4096]
-
blk.45.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.46.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.46.attn_norm.weightF32[4096]
-
blk.46.attn_output.weightI8[4096, 4096]
-
blk.46.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.46.attn_v.weightQ4_K[4096, 1024]
-
blk.46.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.46.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.46.ffn_norm.weightF32[4096]
-
blk.46.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.47.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.47.attn_norm.weightF32[4096]
-
blk.47.attn_output.weightI8[4096, 4096]
-
blk.47.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.47.attn_v.weightQ4_K[4096, 1024]
-
blk.47.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.47.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.47.ffn_norm.weightF32[4096]
-
blk.47.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.48.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.48.attn_norm.weightF32[4096]
-
blk.48.attn_output.weightI8[4096, 4096]
-
blk.48.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.48.attn_v.weightQ4_K[4096, 1024]
-
blk.48.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.48.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.48.ffn_norm.weightF32[4096]
-
blk.48.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
blk.49.attn_k.weight(!unknown_type 29!)[4096, 1024]
-
blk.49.attn_norm.weightF32[4096]
-
blk.49.attn_output.weightI8[4096, 4096]
-
blk.49.attn_q.weight(!unknown_type 29!)[4096, 4096]
-
blk.49.attn_v.weightQ4_K[4096, 1024]
-
blk.49.ffn_down.weight(!unknown_type 29!)[14336, 4096]
-
blk.49.ffn_gate.weight(!unknown_type 29!)[4096, 14336]
-
blk.49.ffn_norm.weightF32[4096]
-
blk.49.ffn_up.weight(!unknown_type 29!)[4096, 14336]
-
output.weightQ5_K[4096, 32128]
-
output_norm.weightF32[4096]
Metadata
Tensor
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49