Fietje: An open and efficient LLM for Dutch (base)
3B
85 Pulls Updated 4 months ago
5f3d4de8e402 · 1.4GB
-
general.architecturephi2
-
general.file_typeQ3_K_M
-
phi2.attention.head_count32
-
phi2.attention.head_count_kv32
-
phi2.attention.layer_norm_epsilon1e-05
-
phi2.block_count32
-
phi2.context_length2048
-
phi2.embedding_length2560
-
phi2.feed_forward_length10240
-
phi2.rope.dimension_count32
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.bos_token_id50256
-
tokenizer.ggml.eos_token_id50256
-
tokenizer.ggml.merges[Ġ t Ġ a h e i n r e ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id50256
-
tokenizer.ggml.prephi-2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
tokenizer.ggml.unknown_token_id50256
-
NameTypeShape
-
token_embd.weightQ3_K[2560 51200]
-
blk.0.attn_norm.biasF32[2560]
-
blk.0.attn_norm.weightF32[2560]
-
blk.0.ffn_up.biasF32[10240]
-
blk.0.ffn_up.weightQ3_K[2560 10240]
-
blk.0.ffn_down.biasF32[2560]
-
blk.0.ffn_down.weightQ5_K[10240 2560]
-
blk.0.attn_output.biasF32[2560]
-
blk.0.attn_output.weightQ4_K[2560 2560]
-
blk.0.attn_k.biasF32[2560]
-
blk.0.attn_k.weightQ3_K[2560 2560]
-
blk.0.attn_q.biasF32[2560]
-
blk.0.attn_q.weightQ3_K[2560 2560]
-
blk.0.attn_v.biasF32[2560]
-
blk.0.attn_v.weightQ5_K[2560 2560]
-
blk.1.attn_norm.biasF32[2560]
-
blk.1.attn_norm.weightF32[2560]
-
blk.1.ffn_up.biasF32[10240]
-
blk.1.ffn_up.weightQ3_K[2560 10240]
-
blk.1.ffn_down.biasF32[2560]
-
blk.1.ffn_down.weightQ5_K[10240 2560]
-
blk.1.attn_output.biasF32[2560]
-
blk.1.attn_output.weightQ4_K[2560 2560]
-
blk.1.attn_k.biasF32[2560]
-
blk.1.attn_k.weightQ3_K[2560 2560]
-
blk.1.attn_q.biasF32[2560]
-
blk.1.attn_q.weightQ3_K[2560 2560]
-
blk.1.attn_v.biasF32[2560]
-
blk.1.attn_v.weightQ5_K[2560 2560]
-
blk.2.attn_norm.biasF32[2560]
-
blk.2.attn_norm.weightF32[2560]
-
blk.2.ffn_up.biasF32[10240]
-
blk.2.ffn_up.weightQ3_K[2560 10240]
-
blk.2.ffn_down.biasF32[2560]
-
blk.2.ffn_down.weightQ4_K[10240 2560]
-
blk.2.attn_output.biasF32[2560]
-
blk.2.attn_output.weightQ4_K[2560 2560]
-
blk.2.attn_k.biasF32[2560]
-
blk.2.attn_k.weightQ3_K[2560 2560]
-
blk.2.attn_q.biasF32[2560]
-
blk.2.attn_q.weightQ3_K[2560 2560]
-
blk.2.attn_v.biasF32[2560]
-
blk.2.attn_v.weightQ4_K[2560 2560]
-
blk.3.attn_norm.biasF32[2560]
-
blk.3.attn_norm.weightF32[2560]
-
blk.3.ffn_up.biasF32[10240]
-
blk.3.ffn_up.weightQ3_K[2560 10240]
-
blk.3.ffn_down.biasF32[2560]
-
blk.3.ffn_down.weightQ4_K[10240 2560]
-
blk.3.attn_output.biasF32[2560]
-
blk.3.attn_output.weightQ4_K[2560 2560]
-
blk.3.attn_k.biasF32[2560]
-
blk.3.attn_k.weightQ3_K[2560 2560]
-
blk.3.attn_q.biasF32[2560]
-
blk.3.attn_q.weightQ3_K[2560 2560]
-
blk.3.attn_v.biasF32[2560]
-
blk.3.attn_v.weightQ4_K[2560 2560]
-
blk.4.attn_norm.biasF32[2560]
-
blk.4.attn_norm.weightF32[2560]
-
blk.4.ffn_up.biasF32[10240]
-
blk.4.ffn_up.weightQ3_K[2560 10240]
-
blk.4.ffn_down.biasF32[2560]
-
blk.4.ffn_down.weightQ4_K[10240 2560]
-
blk.4.attn_output.biasF32[2560]
-
blk.4.attn_output.weightQ4_K[2560 2560]
-
blk.4.attn_k.biasF32[2560]
-
blk.4.attn_k.weightQ3_K[2560 2560]
-
blk.4.attn_q.biasF32[2560]
-
blk.4.attn_q.weightQ3_K[2560 2560]
-
blk.4.attn_v.biasF32[2560]
-
blk.4.attn_v.weightQ4_K[2560 2560]
-
blk.5.attn_norm.biasF32[2560]
-
blk.5.attn_norm.weightF32[2560]
-
blk.5.ffn_up.biasF32[10240]
-
blk.5.ffn_up.weightQ3_K[2560 10240]
-
blk.5.ffn_down.biasF32[2560]
-
blk.5.ffn_down.weightQ4_K[10240 2560]
-
blk.5.attn_output.biasF32[2560]
-
blk.5.attn_output.weightQ4_K[2560 2560]
-
blk.5.attn_k.biasF32[2560]
-
blk.5.attn_k.weightQ3_K[2560 2560]
-
blk.5.attn_q.biasF32[2560]
-
blk.5.attn_q.weightQ3_K[2560 2560]
-
blk.5.attn_v.biasF32[2560]
-
blk.5.attn_v.weightQ4_K[2560 2560]
-
blk.6.attn_norm.biasF32[2560]
-
blk.6.attn_norm.weightF32[2560]
-
blk.6.ffn_up.biasF32[10240]
-
blk.6.ffn_up.weightQ3_K[2560 10240]
-
blk.6.ffn_down.biasF32[2560]
-
blk.6.ffn_down.weightQ4_K[10240 2560]
-
blk.6.attn_output.biasF32[2560]
-
blk.6.attn_output.weightQ4_K[2560 2560]
-
blk.6.attn_k.biasF32[2560]
-
blk.6.attn_k.weightQ3_K[2560 2560]
-
blk.6.attn_q.biasF32[2560]
-
blk.6.attn_q.weightQ3_K[2560 2560]
-
blk.6.attn_v.biasF32[2560]
-
blk.6.attn_v.weightQ4_K[2560 2560]
-
blk.7.attn_norm.biasF32[2560]
-
blk.7.attn_norm.weightF32[2560]
-
blk.7.ffn_up.biasF32[10240]
-
blk.7.ffn_up.weightQ3_K[2560 10240]
-
blk.7.ffn_down.biasF32[2560]
-
blk.7.ffn_down.weightQ4_K[10240 2560]
-
blk.7.attn_output.biasF32[2560]
-
blk.7.attn_output.weightQ4_K[2560 2560]
-
blk.7.attn_k.biasF32[2560]
-
blk.7.attn_k.weightQ3_K[2560 2560]
-
blk.7.attn_q.biasF32[2560]
-
blk.7.attn_q.weightQ3_K[2560 2560]
-
blk.7.attn_v.biasF32[2560]
-
blk.7.attn_v.weightQ4_K[2560 2560]
-
blk.8.attn_norm.biasF32[2560]
-
blk.8.attn_norm.weightF32[2560]
-
blk.8.ffn_up.biasF32[10240]
-
blk.8.ffn_up.weightQ3_K[2560 10240]
-
blk.8.ffn_down.biasF32[2560]
-
blk.8.ffn_down.weightQ4_K[10240 2560]
-
blk.8.attn_output.biasF32[2560]
-
blk.8.attn_output.weightQ4_K[2560 2560]
-
blk.8.attn_k.biasF32[2560]
-
blk.8.attn_k.weightQ3_K[2560 2560]
-
blk.8.attn_q.biasF32[2560]
-
blk.8.attn_q.weightQ3_K[2560 2560]
-
blk.8.attn_v.biasF32[2560]
-
blk.8.attn_v.weightQ4_K[2560 2560]
-
blk.9.attn_norm.biasF32[2560]
-
blk.9.attn_norm.weightF32[2560]
-
blk.9.ffn_up.biasF32[10240]
-
blk.9.ffn_up.weightQ3_K[2560 10240]
-
blk.9.ffn_down.biasF32[2560]
-
blk.9.ffn_down.weightQ4_K[10240 2560]
-
blk.9.attn_output.biasF32[2560]
-
blk.9.attn_output.weightQ4_K[2560 2560]
-
blk.9.attn_k.biasF32[2560]
-
blk.9.attn_k.weightQ3_K[2560 2560]
-
blk.9.attn_q.biasF32[2560]
-
blk.9.attn_q.weightQ3_K[2560 2560]
-
blk.9.attn_v.biasF32[2560]
-
blk.9.attn_v.weightQ4_K[2560 2560]
-
blk.10.attn_norm.biasF32[2560]
-
blk.10.attn_norm.weightF32[2560]
-
blk.10.ffn_up.biasF32[10240]
-
blk.10.ffn_up.weightQ3_K[2560 10240]
-
blk.10.ffn_down.biasF32[2560]
-
blk.10.ffn_down.weightQ4_K[10240 2560]
-
blk.10.attn_output.biasF32[2560]
-
blk.10.attn_output.weightQ4_K[2560 2560]
-
blk.10.attn_k.biasF32[2560]
-
blk.10.attn_k.weightQ3_K[2560 2560]
-
blk.10.attn_q.biasF32[2560]
-
blk.10.attn_q.weightQ3_K[2560 2560]
-
blk.10.attn_v.biasF32[2560]
-
blk.10.attn_v.weightQ4_K[2560 2560]
-
blk.11.attn_norm.biasF32[2560]
-
blk.11.attn_norm.weightF32[2560]
-
blk.11.ffn_up.biasF32[10240]
-
blk.11.ffn_up.weightQ3_K[2560 10240]
-
blk.11.ffn_down.biasF32[2560]
-
blk.11.ffn_down.weightQ4_K[10240 2560]
-
blk.11.attn_output.biasF32[2560]
-
blk.11.attn_output.weightQ4_K[2560 2560]
-
blk.11.attn_k.biasF32[2560]
-
blk.11.attn_k.weightQ3_K[2560 2560]
-
blk.11.attn_q.biasF32[2560]
-
blk.11.attn_q.weightQ3_K[2560 2560]
-
blk.11.attn_v.biasF32[2560]
-
blk.11.attn_v.weightQ4_K[2560 2560]
-
blk.12.attn_norm.biasF32[2560]
-
blk.12.attn_norm.weightF32[2560]
-
blk.12.ffn_up.biasF32[10240]
-
blk.12.ffn_up.weightQ3_K[2560 10240]
-
blk.12.ffn_down.biasF32[2560]
-
blk.12.ffn_down.weightQ4_K[10240 2560]
-
blk.12.attn_output.biasF32[2560]
-
blk.12.attn_output.weightQ4_K[2560 2560]
-
blk.12.attn_k.biasF32[2560]
-
blk.12.attn_k.weightQ3_K[2560 2560]
-
blk.12.attn_q.biasF32[2560]
-
blk.12.attn_q.weightQ3_K[2560 2560]
-
blk.12.attn_v.biasF32[2560]
-
blk.12.attn_v.weightQ4_K[2560 2560]
-
blk.13.attn_norm.biasF32[2560]
-
blk.13.attn_norm.weightF32[2560]
-
blk.13.ffn_up.biasF32[10240]
-
blk.13.ffn_up.weightQ3_K[2560 10240]
-
blk.13.ffn_down.biasF32[2560]
-
blk.13.ffn_down.weightQ4_K[10240 2560]
-
blk.13.attn_output.biasF32[2560]
-
blk.13.attn_output.weightQ4_K[2560 2560]
-
blk.13.attn_k.biasF32[2560]
-
blk.13.attn_k.weightQ3_K[2560 2560]
-
blk.13.attn_q.biasF32[2560]
-
blk.13.attn_q.weightQ3_K[2560 2560]
-
blk.13.attn_v.biasF32[2560]
-
blk.13.attn_v.weightQ4_K[2560 2560]
-
blk.14.attn_norm.biasF32[2560]
-
blk.14.attn_norm.weightF32[2560]
-
blk.14.ffn_up.biasF32[10240]
-
blk.14.ffn_up.weightQ3_K[2560 10240]
-
blk.14.ffn_down.biasF32[2560]
-
blk.14.ffn_down.weightQ4_K[10240 2560]
-
blk.14.attn_output.biasF32[2560]
-
blk.14.attn_output.weightQ4_K[2560 2560]
-
blk.14.attn_k.biasF32[2560]
-
blk.14.attn_k.weightQ3_K[2560 2560]
-
blk.14.attn_q.biasF32[2560]
-
blk.14.attn_q.weightQ3_K[2560 2560]
-
blk.14.attn_v.biasF32[2560]
-
blk.14.attn_v.weightQ4_K[2560 2560]
-
blk.15.attn_norm.biasF32[2560]
-
blk.15.attn_norm.weightF32[2560]
-
blk.15.ffn_up.biasF32[10240]
-
blk.15.ffn_up.weightQ3_K[2560 10240]
-
blk.15.ffn_down.biasF32[2560]
-
blk.15.ffn_down.weightQ4_K[10240 2560]
-
blk.15.attn_output.biasF32[2560]
-
blk.15.attn_output.weightQ4_K[2560 2560]
-
blk.15.attn_k.biasF32[2560]
-
blk.15.attn_k.weightQ3_K[2560 2560]
-
blk.15.attn_q.biasF32[2560]
-
blk.15.attn_q.weightQ3_K[2560 2560]
-
blk.15.attn_v.biasF32[2560]
-
blk.15.attn_v.weightQ4_K[2560 2560]
-
blk.16.attn_norm.biasF32[2560]
-
blk.16.attn_norm.weightF32[2560]
-
blk.16.ffn_up.biasF32[10240]
-
blk.16.ffn_up.weightQ3_K[2560 10240]
-
blk.16.ffn_down.biasF32[2560]
-
blk.16.ffn_down.weightQ4_K[10240 2560]
-
blk.16.attn_output.biasF32[2560]
-
blk.16.attn_output.weightQ4_K[2560 2560]
-
blk.16.attn_k.biasF32[2560]
-
blk.16.attn_k.weightQ3_K[2560 2560]
-
blk.16.attn_q.biasF32[2560]
-
blk.16.attn_q.weightQ3_K[2560 2560]
-
blk.16.attn_v.biasF32[2560]
-
blk.16.attn_v.weightQ4_K[2560 2560]
-
blk.17.attn_norm.biasF32[2560]
-
blk.17.attn_norm.weightF32[2560]
-
blk.17.ffn_up.biasF32[10240]
-
blk.17.ffn_up.weightQ3_K[2560 10240]
-
blk.17.ffn_down.biasF32[2560]
-
blk.17.ffn_down.weightQ4_K[10240 2560]
-
blk.17.attn_output.biasF32[2560]
-
blk.17.attn_output.weightQ4_K[2560 2560]
-
blk.17.attn_k.biasF32[2560]
-
blk.17.attn_k.weightQ3_K[2560 2560]
-
blk.17.attn_q.biasF32[2560]
-
blk.17.attn_q.weightQ3_K[2560 2560]
-
blk.17.attn_v.biasF32[2560]
-
blk.17.attn_v.weightQ4_K[2560 2560]
-
blk.18.attn_norm.biasF32[2560]
-
blk.18.attn_norm.weightF32[2560]
-
blk.18.ffn_up.biasF32[10240]
-
blk.18.ffn_up.weightQ3_K[2560 10240]
-
blk.18.ffn_down.biasF32[2560]
-
blk.18.ffn_down.weightQ4_K[10240 2560]
-
blk.18.attn_output.biasF32[2560]
-
blk.18.attn_output.weightQ4_K[2560 2560]
-
blk.18.attn_k.biasF32[2560]
-
blk.18.attn_k.weightQ3_K[2560 2560]
-
blk.18.attn_q.biasF32[2560]
-
blk.18.attn_q.weightQ3_K[2560 2560]
-
blk.18.attn_v.biasF32[2560]
-
blk.18.attn_v.weightQ4_K[2560 2560]
-
blk.19.attn_norm.biasF32[2560]
-
blk.19.attn_norm.weightF32[2560]
-
blk.19.ffn_up.biasF32[10240]
-
blk.19.ffn_up.weightQ3_K[2560 10240]
-
blk.19.ffn_down.biasF32[2560]
-
blk.19.ffn_down.weightQ4_K[10240 2560]
-
blk.19.attn_output.biasF32[2560]
-
blk.19.attn_output.weightQ4_K[2560 2560]
-
blk.19.attn_k.biasF32[2560]
-
blk.19.attn_k.weightQ3_K[2560 2560]
-
blk.19.attn_q.biasF32[2560]
-
blk.19.attn_q.weightQ3_K[2560 2560]
-
blk.19.attn_v.biasF32[2560]
-
blk.19.attn_v.weightQ4_K[2560 2560]
-
blk.20.attn_norm.biasF32[2560]
-
blk.20.attn_norm.weightF32[2560]
-
blk.20.ffn_up.biasF32[10240]
-
blk.20.ffn_up.weightQ3_K[2560 10240]
-
blk.20.ffn_down.biasF32[2560]
-
blk.20.ffn_down.weightQ4_K[10240 2560]
-
blk.20.attn_output.biasF32[2560]
-
blk.20.attn_output.weightQ4_K[2560 2560]
-
blk.20.attn_k.biasF32[2560]
-
blk.20.attn_k.weightQ3_K[2560 2560]
-
blk.20.attn_q.biasF32[2560]
-
blk.20.attn_q.weightQ3_K[2560 2560]
-
blk.20.attn_v.biasF32[2560]
-
blk.20.attn_v.weightQ4_K[2560 2560]
-
blk.21.attn_norm.biasF32[2560]
-
blk.21.attn_norm.weightF32[2560]
-
blk.21.ffn_up.biasF32[10240]
-
blk.21.ffn_up.weightQ3_K[2560 10240]
-
blk.21.ffn_down.biasF32[2560]
-
blk.21.ffn_down.weightQ4_K[10240 2560]
-
blk.21.attn_output.biasF32[2560]
-
blk.21.attn_output.weightQ4_K[2560 2560]
-
blk.21.attn_k.biasF32[2560]
-
blk.21.attn_k.weightQ3_K[2560 2560]
-
blk.21.attn_q.biasF32[2560]
-
blk.21.attn_q.weightQ3_K[2560 2560]
-
blk.21.attn_v.biasF32[2560]
-
blk.21.attn_v.weightQ4_K[2560 2560]
-
blk.22.attn_norm.biasF32[2560]
-
blk.22.attn_norm.weightF32[2560]
-
blk.22.ffn_up.biasF32[10240]
-
blk.22.ffn_up.weightQ3_K[2560 10240]
-
blk.22.ffn_down.biasF32[2560]
-
blk.22.ffn_down.weightQ4_K[10240 2560]
-
blk.22.attn_output.biasF32[2560]
-
blk.22.attn_output.weightQ4_K[2560 2560]
-
blk.22.attn_k.biasF32[2560]
-
blk.22.attn_k.weightQ3_K[2560 2560]
-
blk.22.attn_q.biasF32[2560]
-
blk.22.attn_q.weightQ3_K[2560 2560]
-
blk.22.attn_v.biasF32[2560]
-
blk.22.attn_v.weightQ4_K[2560 2560]
-
blk.23.attn_norm.biasF32[2560]
-
blk.23.attn_norm.weightF32[2560]
-
blk.23.ffn_up.biasF32[10240]
-
blk.23.ffn_up.weightQ3_K[2560 10240]
-
blk.23.ffn_down.biasF32[2560]
-
blk.23.ffn_down.weightQ4_K[10240 2560]
-
blk.23.attn_output.biasF32[2560]
-
blk.23.attn_output.weightQ4_K[2560 2560]
-
blk.23.attn_k.biasF32[2560]
-
blk.23.attn_k.weightQ3_K[2560 2560]
-
blk.23.attn_q.biasF32[2560]
-
blk.23.attn_q.weightQ3_K[2560 2560]
-
blk.23.attn_v.biasF32[2560]
-
blk.23.attn_v.weightQ4_K[2560 2560]
-
blk.24.attn_norm.biasF32[2560]
-
blk.24.attn_norm.weightF32[2560]
-
blk.24.ffn_up.biasF32[10240]
-
blk.24.ffn_up.weightQ3_K[2560 10240]
-
blk.24.ffn_down.biasF32[2560]
-
blk.24.ffn_down.weightQ4_K[10240 2560]
-
blk.24.attn_output.biasF32[2560]
-
blk.24.attn_output.weightQ4_K[2560 2560]
-
blk.24.attn_k.biasF32[2560]
-
blk.24.attn_k.weightQ3_K[2560 2560]
-
blk.24.attn_q.biasF32[2560]
-
blk.24.attn_q.weightQ3_K[2560 2560]
-
blk.24.attn_v.biasF32[2560]
-
blk.24.attn_v.weightQ4_K[2560 2560]
-
blk.25.attn_norm.biasF32[2560]
-
blk.25.attn_norm.weightF32[2560]
-
blk.25.ffn_up.biasF32[10240]
-
blk.25.ffn_up.weightQ3_K[2560 10240]
-
blk.25.ffn_down.biasF32[2560]
-
blk.25.ffn_down.weightQ4_K[10240 2560]
-
blk.25.attn_output.biasF32[2560]
-
blk.25.attn_output.weightQ4_K[2560 2560]
-
blk.25.attn_k.biasF32[2560]
-
blk.25.attn_k.weightQ3_K[2560 2560]
-
blk.25.attn_q.biasF32[2560]
-
blk.25.attn_q.weightQ3_K[2560 2560]
-
blk.25.attn_v.biasF32[2560]
-
blk.25.attn_v.weightQ4_K[2560 2560]
-
blk.26.attn_norm.biasF32[2560]
-
blk.26.attn_norm.weightF32[2560]
-
blk.26.ffn_up.biasF32[10240]
-
blk.26.ffn_up.weightQ3_K[2560 10240]
-
blk.26.ffn_down.biasF32[2560]
-
blk.26.ffn_down.weightQ4_K[10240 2560]
-
blk.26.attn_output.biasF32[2560]
-
blk.26.attn_output.weightQ4_K[2560 2560]
-
blk.26.attn_k.biasF32[2560]
-
blk.26.attn_k.weightQ3_K[2560 2560]
-
blk.26.attn_q.biasF32[2560]
-
blk.26.attn_q.weightQ3_K[2560 2560]
-
blk.26.attn_v.biasF32[2560]
-
blk.26.attn_v.weightQ4_K[2560 2560]
-
blk.27.attn_norm.biasF32[2560]
-
blk.27.attn_norm.weightF32[2560]
-
blk.27.ffn_up.biasF32[10240]
-
blk.27.ffn_up.weightQ3_K[2560 10240]
-
blk.27.ffn_down.biasF32[2560]
-
blk.27.ffn_down.weightQ4_K[10240 2560]
-
blk.27.attn_output.biasF32[2560]
-
blk.27.attn_output.weightQ4_K[2560 2560]
-
blk.27.attn_k.biasF32[2560]
-
blk.27.attn_k.weightQ3_K[2560 2560]
-
blk.27.attn_q.biasF32[2560]
-
blk.27.attn_q.weightQ3_K[2560 2560]
-
blk.27.attn_v.biasF32[2560]
-
blk.27.attn_v.weightQ4_K[2560 2560]
-
blk.28.attn_norm.biasF32[2560]
-
blk.28.attn_norm.weightF32[2560]
-
blk.28.ffn_up.biasF32[10240]
-
blk.28.ffn_up.weightQ3_K[2560 10240]
-
blk.28.ffn_down.biasF32[2560]
-
blk.28.ffn_down.weightQ4_K[10240 2560]
-
blk.28.attn_output.biasF32[2560]
-
blk.28.attn_output.weightQ4_K[2560 2560]
-
blk.28.attn_k.biasF32[2560]
-
blk.28.attn_k.weightQ3_K[2560 2560]
-
blk.28.attn_q.biasF32[2560]
-
blk.28.attn_q.weightQ3_K[2560 2560]
-
blk.28.attn_v.biasF32[2560]
-
blk.28.attn_v.weightQ4_K[2560 2560]
-
blk.29.attn_norm.biasF32[2560]
-
blk.29.attn_norm.weightF32[2560]
-
blk.29.ffn_up.biasF32[10240]
-
blk.29.ffn_up.weightQ3_K[2560 10240]
-
blk.29.ffn_down.biasF32[2560]
-
blk.29.ffn_down.weightQ4_K[10240 2560]
-
blk.29.attn_output.biasF32[2560]
-
blk.29.attn_output.weightQ4_K[2560 2560]
-
blk.29.attn_k.biasF32[2560]
-
blk.29.attn_k.weightQ3_K[2560 2560]
-
blk.29.attn_q.biasF32[2560]
-
blk.29.attn_q.weightQ3_K[2560 2560]
-
blk.29.attn_v.biasF32[2560]
-
blk.29.attn_v.weightQ4_K[2560 2560]
-
blk.30.attn_q.biasF32[2560]
-
blk.30.attn_q.weightQ3_K[2560 2560]
-
blk.30.attn_norm.biasF32[2560]
-
blk.30.attn_norm.weightF32[2560]
-
blk.30.ffn_up.biasF32[10240]
-
blk.30.ffn_up.weightQ3_K[2560 10240]
-
blk.30.ffn_down.biasF32[2560]
-
blk.30.ffn_down.weightQ4_K[10240 2560]
-
blk.30.attn_output.biasF32[2560]
-
blk.30.attn_output.weightQ4_K[2560 2560]
-
blk.30.attn_k.biasF32[2560]
-
blk.30.attn_k.weightQ3_K[2560 2560]
-
blk.30.attn_v.biasF32[2560]
-
blk.30.attn_v.weightQ4_K[2560 2560]
-
blk.31.attn_norm.biasF32[2560]
-
blk.31.attn_norm.weightF32[2560]
-
blk.31.ffn_up.biasF32[10240]
-
blk.31.ffn_up.weightQ3_K[2560 10240]
-
blk.31.ffn_down.biasF32[2560]
-
blk.31.ffn_down.weightQ4_K[10240 2560]
-
blk.31.attn_output.biasF32[2560]
-
blk.31.attn_output.weightQ4_K[2560 2560]
-
blk.31.attn_k.biasF32[2560]
-
blk.31.attn_k.weightQ3_K[2560 2560]
-
blk.31.attn_q.biasF32[2560]
-
blk.31.attn_q.weightQ3_K[2560 2560]
-
blk.31.attn_v.biasF32[2560]
-
blk.31.attn_v.weightQ4_K[2560 2560]
-
output.biasF32[51200]
-
output.weightQ6_K[2560 51200]
-
output_norm.biasF32[2560]
-
output_norm.weightF32[2560]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31