yanolja eeve korean model
3B
208 Pulls Updated 3 months ago
1df6daac0b60 · 1.8GB
-
general.architecturephi2
-
general.file_typeQ4_K_M
-
phi2.attention.head_count32
-
phi2.attention.head_count_kv32
-
phi2.attention.layer_norm_epsilon1e-05
-
phi2.block_count32
-
phi2.context_length2048
-
phi2.embedding_length2560
-
phi2.feed_forward_length10240
-
phi2.rope.dimension_count32
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id58940
-
tokenizer.ggml.eos_token_id58943
-
tokenizer.ggml.merges[▁ ▁ ▁ ▁▁ ▁▁ ▁ ▁ ▁▁▁ ▁▁ ▁▁ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id58941
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
tokenizer.ggml.unknown_token_id50256
-
NameTypeShape
-
token_embd.weightQ4_K[2560 58944]
-
blk.0.attn_norm.biasF32[2560]
-
blk.0.attn_norm.weightF32[2560]
-
blk.0.ffn_up.biasF32[10240]
-
blk.0.ffn_up.weightQ4_K[2560 10240]
-
blk.0.ffn_down.biasF32[2560]
-
blk.0.ffn_down.weightQ6_K[10240 2560]
-
blk.0.attn_output.biasF32[2560]
-
blk.0.attn_output.weightQ4_K[2560 2560]
-
blk.0.attn_k.biasF32[2560]
-
blk.0.attn_k.weightQ4_K[2560 2560]
-
blk.0.attn_q.biasF32[2560]
-
blk.0.attn_q.weightQ4_K[2560 2560]
-
blk.0.attn_v.biasF32[2560]
-
blk.0.attn_v.weightQ6_K[2560 2560]
-
blk.1.attn_norm.biasF32[2560]
-
blk.1.attn_norm.weightF32[2560]
-
blk.1.ffn_up.biasF32[10240]
-
blk.1.ffn_up.weightQ4_K[2560 10240]
-
blk.1.ffn_down.biasF32[2560]
-
blk.1.ffn_down.weightQ6_K[10240 2560]
-
blk.1.attn_output.biasF32[2560]
-
blk.1.attn_output.weightQ4_K[2560 2560]
-
blk.1.attn_k.biasF32[2560]
-
blk.1.attn_k.weightQ4_K[2560 2560]
-
blk.1.attn_q.biasF32[2560]
-
blk.1.attn_q.weightQ4_K[2560 2560]
-
blk.1.attn_v.biasF32[2560]
-
blk.1.attn_v.weightQ6_K[2560 2560]
-
blk.2.attn_norm.biasF32[2560]
-
blk.2.attn_norm.weightF32[2560]
-
blk.2.ffn_up.biasF32[10240]
-
blk.2.ffn_up.weightQ4_K[2560 10240]
-
blk.2.ffn_down.biasF32[2560]
-
blk.2.ffn_down.weightQ6_K[10240 2560]
-
blk.2.attn_output.biasF32[2560]
-
blk.2.attn_output.weightQ4_K[2560 2560]
-
blk.2.attn_k.biasF32[2560]
-
blk.2.attn_k.weightQ4_K[2560 2560]
-
blk.2.attn_q.biasF32[2560]
-
blk.2.attn_q.weightQ4_K[2560 2560]
-
blk.2.attn_v.biasF32[2560]
-
blk.2.attn_v.weightQ6_K[2560 2560]
-
blk.3.attn_norm.biasF32[2560]
-
blk.3.attn_norm.weightF32[2560]
-
blk.3.ffn_up.biasF32[10240]
-
blk.3.ffn_up.weightQ4_K[2560 10240]
-
blk.3.ffn_down.biasF32[2560]
-
blk.3.ffn_down.weightQ4_K[10240 2560]
-
blk.3.attn_output.biasF32[2560]
-
blk.3.attn_output.weightQ4_K[2560 2560]
-
blk.3.attn_k.biasF32[2560]
-
blk.3.attn_k.weightQ4_K[2560 2560]
-
blk.3.attn_q.biasF32[2560]
-
blk.3.attn_q.weightQ4_K[2560 2560]
-
blk.3.attn_v.biasF32[2560]
-
blk.3.attn_v.weightQ4_K[2560 2560]
-
blk.4.attn_norm.biasF32[2560]
-
blk.4.attn_norm.weightF32[2560]
-
blk.4.ffn_up.biasF32[10240]
-
blk.4.ffn_up.weightQ4_K[2560 10240]
-
blk.4.ffn_down.biasF32[2560]
-
blk.4.ffn_down.weightQ4_K[10240 2560]
-
blk.4.attn_output.biasF32[2560]
-
blk.4.attn_output.weightQ4_K[2560 2560]
-
blk.4.attn_k.biasF32[2560]
-
blk.4.attn_k.weightQ4_K[2560 2560]
-
blk.4.attn_q.biasF32[2560]
-
blk.4.attn_q.weightQ4_K[2560 2560]
-
blk.4.attn_v.biasF32[2560]
-
blk.4.attn_v.weightQ6_K[2560 2560]
-
blk.5.attn_norm.biasF32[2560]
-
blk.5.attn_norm.weightF32[2560]
-
blk.5.ffn_up.biasF32[10240]
-
blk.5.ffn_up.weightQ4_K[2560 10240]
-
blk.5.ffn_down.biasF32[2560]
-
blk.5.ffn_down.weightQ6_K[10240 2560]
-
blk.5.attn_output.biasF32[2560]
-
blk.5.attn_output.weightQ4_K[2560 2560]
-
blk.5.attn_k.biasF32[2560]
-
blk.5.attn_k.weightQ4_K[2560 2560]
-
blk.5.attn_q.biasF32[2560]
-
blk.5.attn_q.weightQ4_K[2560 2560]
-
blk.5.attn_v.biasF32[2560]
-
blk.5.attn_v.weightQ4_K[2560 2560]
-
blk.6.attn_norm.biasF32[2560]
-
blk.6.attn_norm.weightF32[2560]
-
blk.6.ffn_up.biasF32[10240]
-
blk.6.ffn_up.weightQ4_K[2560 10240]
-
blk.6.ffn_down.biasF32[2560]
-
blk.6.ffn_down.weightQ4_K[10240 2560]
-
blk.6.attn_output.biasF32[2560]
-
blk.6.attn_output.weightQ4_K[2560 2560]
-
blk.6.attn_k.biasF32[2560]
-
blk.6.attn_k.weightQ4_K[2560 2560]
-
blk.6.attn_q.biasF32[2560]
-
blk.6.attn_q.weightQ4_K[2560 2560]
-
blk.6.attn_v.biasF32[2560]
-
blk.6.attn_v.weightQ4_K[2560 2560]
-
blk.7.attn_norm.biasF32[2560]
-
blk.7.attn_norm.weightF32[2560]
-
blk.7.ffn_up.biasF32[10240]
-
blk.7.ffn_up.weightQ4_K[2560 10240]
-
blk.7.ffn_down.biasF32[2560]
-
blk.7.ffn_down.weightQ4_K[10240 2560]
-
blk.7.attn_output.biasF32[2560]
-
blk.7.attn_output.weightQ4_K[2560 2560]
-
blk.7.attn_k.biasF32[2560]
-
blk.7.attn_k.weightQ4_K[2560 2560]
-
blk.7.attn_q.biasF32[2560]
-
blk.7.attn_q.weightQ4_K[2560 2560]
-
blk.7.attn_v.biasF32[2560]
-
blk.7.attn_v.weightQ6_K[2560 2560]
-
blk.8.attn_norm.biasF32[2560]
-
blk.8.attn_norm.weightF32[2560]
-
blk.8.ffn_up.biasF32[10240]
-
blk.8.ffn_up.weightQ4_K[2560 10240]
-
blk.8.ffn_down.biasF32[2560]
-
blk.8.ffn_down.weightQ6_K[10240 2560]
-
blk.8.attn_output.biasF32[2560]
-
blk.8.attn_output.weightQ4_K[2560 2560]
-
blk.8.attn_k.biasF32[2560]
-
blk.8.attn_k.weightQ4_K[2560 2560]
-
blk.8.attn_q.biasF32[2560]
-
blk.8.attn_q.weightQ4_K[2560 2560]
-
blk.8.attn_v.biasF32[2560]
-
blk.8.attn_v.weightQ6_K[2560 2560]
-
blk.9.attn_norm.biasF32[2560]
-
blk.9.attn_norm.weightF32[2560]
-
blk.9.ffn_up.biasF32[10240]
-
blk.9.ffn_up.weightQ4_K[2560 10240]
-
blk.9.ffn_down.biasF32[2560]
-
blk.9.ffn_down.weightQ6_K[10240 2560]
-
blk.9.attn_output.biasF32[2560]
-
blk.9.attn_output.weightQ4_K[2560 2560]
-
blk.9.attn_k.biasF32[2560]
-
blk.9.attn_k.weightQ4_K[2560 2560]
-
blk.9.attn_q.biasF32[2560]
-
blk.9.attn_q.weightQ4_K[2560 2560]
-
blk.9.attn_v.biasF32[2560]
-
blk.9.attn_v.weightQ6_K[2560 2560]
-
blk.10.attn_norm.biasF32[2560]
-
blk.10.attn_norm.weightF32[2560]
-
blk.10.ffn_up.biasF32[10240]
-
blk.10.ffn_up.weightQ4_K[2560 10240]
-
blk.10.ffn_down.biasF32[2560]
-
blk.10.ffn_down.weightQ6_K[10240 2560]
-
blk.10.attn_output.biasF32[2560]
-
blk.10.attn_output.weightQ4_K[2560 2560]
-
blk.10.attn_k.biasF32[2560]
-
blk.10.attn_k.weightQ4_K[2560 2560]
-
blk.10.attn_q.biasF32[2560]
-
blk.10.attn_q.weightQ4_K[2560 2560]
-
blk.10.attn_v.biasF32[2560]
-
blk.10.attn_v.weightQ6_K[2560 2560]
-
blk.11.attn_norm.biasF32[2560]
-
blk.11.attn_norm.weightF32[2560]
-
blk.11.ffn_up.biasF32[10240]
-
blk.11.ffn_up.weightQ4_K[2560 10240]
-
blk.11.ffn_down.biasF32[2560]
-
blk.11.ffn_down.weightQ6_K[10240 2560]
-
blk.11.attn_output.biasF32[2560]
-
blk.11.attn_output.weightQ4_K[2560 2560]
-
blk.11.attn_k.biasF32[2560]
-
blk.11.attn_k.weightQ4_K[2560 2560]
-
blk.11.attn_q.biasF32[2560]
-
blk.11.attn_q.weightQ4_K[2560 2560]
-
blk.11.attn_v.biasF32[2560]
-
blk.11.attn_v.weightQ6_K[2560 2560]
-
blk.12.attn_norm.biasF32[2560]
-
blk.12.attn_norm.weightF32[2560]
-
blk.12.ffn_up.biasF32[10240]
-
blk.12.ffn_up.weightQ4_K[2560 10240]
-
blk.12.ffn_down.biasF32[2560]
-
blk.12.ffn_down.weightQ4_K[10240 2560]
-
blk.12.attn_output.biasF32[2560]
-
blk.12.attn_output.weightQ4_K[2560 2560]
-
blk.12.attn_k.biasF32[2560]
-
blk.12.attn_k.weightQ4_K[2560 2560]
-
blk.12.attn_q.biasF32[2560]
-
blk.12.attn_q.weightQ4_K[2560 2560]
-
blk.12.attn_v.biasF32[2560]
-
blk.12.attn_v.weightQ4_K[2560 2560]
-
blk.13.attn_norm.biasF32[2560]
-
blk.13.attn_norm.weightF32[2560]
-
blk.13.ffn_up.biasF32[10240]
-
blk.13.ffn_up.weightQ4_K[2560 10240]
-
blk.13.ffn_down.biasF32[2560]
-
blk.13.ffn_down.weightQ4_K[10240 2560]
-
blk.13.attn_output.biasF32[2560]
-
blk.13.attn_output.weightQ4_K[2560 2560]
-
blk.13.attn_k.biasF32[2560]
-
blk.13.attn_k.weightQ4_K[2560 2560]
-
blk.13.attn_q.biasF32[2560]
-
blk.13.attn_q.weightQ4_K[2560 2560]
-
blk.13.attn_v.biasF32[2560]
-
blk.13.attn_v.weightQ4_K[2560 2560]
-
blk.14.attn_norm.biasF32[2560]
-
blk.14.attn_norm.weightF32[2560]
-
blk.14.ffn_up.biasF32[10240]
-
blk.14.ffn_up.weightQ4_K[2560 10240]
-
blk.14.ffn_down.biasF32[2560]
-
blk.14.ffn_down.weightQ6_K[10240 2560]
-
blk.14.attn_output.biasF32[2560]
-
blk.14.attn_output.weightQ4_K[2560 2560]
-
blk.14.attn_k.biasF32[2560]
-
blk.14.attn_k.weightQ4_K[2560 2560]
-
blk.14.attn_q.biasF32[2560]
-
blk.14.attn_q.weightQ4_K[2560 2560]
-
blk.14.attn_v.biasF32[2560]
-
blk.14.attn_v.weightQ6_K[2560 2560]
-
blk.15.attn_norm.biasF32[2560]
-
blk.15.attn_norm.weightF32[2560]
-
blk.15.ffn_up.biasF32[10240]
-
blk.15.ffn_up.weightQ4_K[2560 10240]
-
blk.15.ffn_down.biasF32[2560]
-
blk.15.ffn_down.weightQ4_K[10240 2560]
-
blk.15.attn_output.biasF32[2560]
-
blk.15.attn_output.weightQ4_K[2560 2560]
-
blk.15.attn_k.biasF32[2560]
-
blk.15.attn_k.weightQ4_K[2560 2560]
-
blk.15.attn_q.biasF32[2560]
-
blk.15.attn_q.weightQ4_K[2560 2560]
-
blk.15.attn_v.biasF32[2560]
-
blk.15.attn_v.weightQ4_K[2560 2560]
-
blk.16.attn_norm.biasF32[2560]
-
blk.16.attn_norm.weightF32[2560]
-
blk.16.ffn_up.biasF32[10240]
-
blk.16.ffn_up.weightQ4_K[2560 10240]
-
blk.16.ffn_down.biasF32[2560]
-
blk.16.ffn_down.weightQ4_K[10240 2560]
-
blk.16.attn_output.biasF32[2560]
-
blk.16.attn_output.weightQ4_K[2560 2560]
-
blk.16.attn_k.biasF32[2560]
-
blk.16.attn_k.weightQ4_K[2560 2560]
-
blk.16.attn_q.biasF32[2560]
-
blk.16.attn_q.weightQ4_K[2560 2560]
-
blk.16.attn_v.biasF32[2560]
-
blk.16.attn_v.weightQ4_K[2560 2560]
-
blk.17.attn_norm.biasF32[2560]
-
blk.17.attn_norm.weightF32[2560]
-
blk.17.ffn_up.biasF32[10240]
-
blk.17.ffn_up.weightQ4_K[2560 10240]
-
blk.17.ffn_down.biasF32[2560]
-
blk.17.ffn_down.weightQ6_K[10240 2560]
-
blk.17.attn_output.biasF32[2560]
-
blk.17.attn_output.weightQ4_K[2560 2560]
-
blk.17.attn_k.biasF32[2560]
-
blk.17.attn_k.weightQ4_K[2560 2560]
-
blk.17.attn_q.biasF32[2560]
-
blk.17.attn_q.weightQ4_K[2560 2560]
-
blk.17.attn_v.biasF32[2560]
-
blk.17.attn_v.weightQ6_K[2560 2560]
-
blk.18.attn_norm.biasF32[2560]
-
blk.18.attn_norm.weightF32[2560]
-
blk.18.ffn_up.biasF32[10240]
-
blk.18.ffn_up.weightQ4_K[2560 10240]
-
blk.18.ffn_down.biasF32[2560]
-
blk.18.ffn_down.weightQ4_K[10240 2560]
-
blk.18.attn_output.biasF32[2560]
-
blk.18.attn_output.weightQ4_K[2560 2560]
-
blk.18.attn_k.biasF32[2560]
-
blk.18.attn_k.weightQ4_K[2560 2560]
-
blk.18.attn_q.biasF32[2560]
-
blk.18.attn_q.weightQ4_K[2560 2560]
-
blk.18.attn_v.biasF32[2560]
-
blk.18.attn_v.weightQ4_K[2560 2560]
-
blk.19.attn_norm.biasF32[2560]
-
blk.19.attn_norm.weightF32[2560]
-
blk.19.ffn_up.biasF32[10240]
-
blk.19.ffn_up.weightQ4_K[2560 10240]
-
blk.19.ffn_down.biasF32[2560]
-
blk.19.ffn_down.weightQ4_K[10240 2560]
-
blk.19.attn_output.biasF32[2560]
-
blk.19.attn_output.weightQ4_K[2560 2560]
-
blk.19.attn_k.biasF32[2560]
-
blk.19.attn_k.weightQ4_K[2560 2560]
-
blk.19.attn_q.biasF32[2560]
-
blk.19.attn_q.weightQ4_K[2560 2560]
-
blk.19.attn_v.biasF32[2560]
-
blk.19.attn_v.weightQ4_K[2560 2560]
-
blk.20.attn_norm.biasF32[2560]
-
blk.20.attn_norm.weightF32[2560]
-
blk.20.ffn_up.biasF32[10240]
-
blk.20.ffn_up.weightQ4_K[2560 10240]
-
blk.20.ffn_down.biasF32[2560]
-
blk.20.ffn_down.weightQ4_K[10240 2560]
-
blk.20.attn_output.biasF32[2560]
-
blk.20.attn_output.weightQ4_K[2560 2560]
-
blk.20.attn_k.biasF32[2560]
-
blk.20.attn_k.weightQ4_K[2560 2560]
-
blk.20.attn_q.biasF32[2560]
-
blk.20.attn_q.weightQ4_K[2560 2560]
-
blk.20.attn_v.biasF32[2560]
-
blk.20.attn_v.weightQ4_K[2560 2560]
-
blk.21.attn_norm.biasF32[2560]
-
blk.21.attn_norm.weightF32[2560]
-
blk.21.ffn_up.biasF32[10240]
-
blk.21.ffn_up.weightQ4_K[2560 10240]
-
blk.21.ffn_down.biasF32[2560]
-
blk.21.ffn_down.weightQ4_K[10240 2560]
-
blk.21.attn_output.biasF32[2560]
-
blk.21.attn_output.weightQ4_K[2560 2560]
-
blk.21.attn_k.biasF32[2560]
-
blk.21.attn_k.weightQ4_K[2560 2560]
-
blk.21.attn_q.biasF32[2560]
-
blk.21.attn_q.weightQ4_K[2560 2560]
-
blk.21.attn_v.biasF32[2560]
-
blk.21.attn_v.weightQ4_K[2560 2560]
-
blk.22.attn_norm.biasF32[2560]
-
blk.22.attn_norm.weightF32[2560]
-
blk.22.ffn_up.biasF32[10240]
-
blk.22.ffn_up.weightQ4_K[2560 10240]
-
blk.22.ffn_down.biasF32[2560]
-
blk.22.ffn_down.weightQ6_K[10240 2560]
-
blk.22.attn_output.biasF32[2560]
-
blk.22.attn_output.weightQ4_K[2560 2560]
-
blk.22.attn_k.biasF32[2560]
-
blk.22.attn_k.weightQ4_K[2560 2560]
-
blk.22.attn_q.biasF32[2560]
-
blk.22.attn_q.weightQ4_K[2560 2560]
-
blk.22.attn_v.biasF32[2560]
-
blk.22.attn_v.weightQ6_K[2560 2560]
-
blk.23.attn_norm.biasF32[2560]
-
blk.23.attn_norm.weightF32[2560]
-
blk.23.ffn_up.biasF32[10240]
-
blk.23.ffn_up.weightQ4_K[2560 10240]
-
blk.23.ffn_down.biasF32[2560]
-
blk.23.ffn_down.weightQ4_K[10240 2560]
-
blk.23.attn_output.biasF32[2560]
-
blk.23.attn_output.weightQ4_K[2560 2560]
-
blk.23.attn_k.biasF32[2560]
-
blk.23.attn_k.weightQ4_K[2560 2560]
-
blk.23.attn_q.biasF32[2560]
-
blk.23.attn_q.weightQ4_K[2560 2560]
-
blk.23.attn_v.biasF32[2560]
-
blk.23.attn_v.weightQ4_K[2560 2560]
-
blk.24.attn_norm.biasF32[2560]
-
blk.24.attn_norm.weightF32[2560]
-
blk.24.ffn_up.biasF32[10240]
-
blk.24.ffn_up.weightQ4_K[2560 10240]
-
blk.24.ffn_down.biasF32[2560]
-
blk.24.ffn_down.weightQ4_K[10240 2560]
-
blk.24.attn_output.biasF32[2560]
-
blk.24.attn_output.weightQ4_K[2560 2560]
-
blk.24.attn_k.biasF32[2560]
-
blk.24.attn_k.weightQ4_K[2560 2560]
-
blk.24.attn_q.biasF32[2560]
-
blk.24.attn_q.weightQ4_K[2560 2560]
-
blk.24.attn_v.biasF32[2560]
-
blk.24.attn_v.weightQ4_K[2560 2560]
-
blk.25.attn_norm.biasF32[2560]
-
blk.25.attn_norm.weightF32[2560]
-
blk.25.ffn_up.biasF32[10240]
-
blk.25.ffn_up.weightQ4_K[2560 10240]
-
blk.25.ffn_down.biasF32[2560]
-
blk.25.ffn_down.weightQ6_K[10240 2560]
-
blk.25.attn_output.biasF32[2560]
-
blk.25.attn_output.weightQ4_K[2560 2560]
-
blk.25.attn_k.biasF32[2560]
-
blk.25.attn_k.weightQ4_K[2560 2560]
-
blk.25.attn_q.biasF32[2560]
-
blk.25.attn_q.weightQ4_K[2560 2560]
-
blk.25.attn_v.biasF32[2560]
-
blk.25.attn_v.weightQ6_K[2560 2560]
-
blk.26.attn_norm.biasF32[2560]
-
blk.26.attn_norm.weightF32[2560]
-
blk.26.ffn_up.biasF32[10240]
-
blk.26.ffn_up.weightQ4_K[2560 10240]
-
blk.26.ffn_down.biasF32[2560]
-
blk.26.ffn_down.weightQ4_K[10240 2560]
-
blk.26.attn_output.biasF32[2560]
-
blk.26.attn_output.weightQ4_K[2560 2560]
-
blk.26.attn_k.biasF32[2560]
-
blk.26.attn_k.weightQ4_K[2560 2560]
-
blk.26.attn_q.biasF32[2560]
-
blk.26.attn_q.weightQ4_K[2560 2560]
-
blk.26.attn_v.biasF32[2560]
-
blk.26.attn_v.weightQ4_K[2560 2560]
-
blk.27.attn_norm.biasF32[2560]
-
blk.27.attn_norm.weightF32[2560]
-
blk.27.ffn_up.biasF32[10240]
-
blk.27.ffn_up.weightQ4_K[2560 10240]
-
blk.27.ffn_down.biasF32[2560]
-
blk.27.ffn_down.weightQ4_K[10240 2560]
-
blk.27.attn_output.biasF32[2560]
-
blk.27.attn_output.weightQ4_K[2560 2560]
-
blk.27.attn_k.biasF32[2560]
-
blk.27.attn_k.weightQ4_K[2560 2560]
-
blk.27.attn_q.biasF32[2560]
-
blk.27.attn_q.weightQ4_K[2560 2560]
-
blk.27.attn_v.biasF32[2560]
-
blk.27.attn_v.weightQ4_K[2560 2560]
-
blk.28.attn_norm.biasF32[2560]
-
blk.28.attn_norm.weightF32[2560]
-
blk.28.ffn_up.biasF32[10240]
-
blk.28.ffn_up.weightQ4_K[2560 10240]
-
blk.28.ffn_down.biasF32[2560]
-
blk.28.ffn_down.weightQ6_K[10240 2560]
-
blk.28.attn_output.biasF32[2560]
-
blk.28.attn_output.weightQ4_K[2560 2560]
-
blk.28.attn_k.biasF32[2560]
-
blk.28.attn_k.weightQ4_K[2560 2560]
-
blk.28.attn_q.biasF32[2560]
-
blk.28.attn_q.weightQ4_K[2560 2560]
-
blk.28.attn_v.biasF32[2560]
-
blk.28.attn_v.weightQ6_K[2560 2560]
-
blk.29.ffn_up.biasF32[10240]
-
blk.29.ffn_up.weightQ4_K[2560 10240]
-
blk.29.attn_output.biasF32[2560]
-
blk.29.attn_output.weightQ4_K[2560 2560]
-
blk.29.attn_k.biasF32[2560]
-
blk.29.attn_k.weightQ4_K[2560 2560]
-
blk.29.attn_q.biasF32[2560]
-
blk.29.attn_q.weightQ4_K[2560 2560]
-
blk.29.attn_v.biasF32[2560]
-
blk.29.attn_v.weightQ4_K[2560 2560]
-
blk.29.attn_norm.biasF32[2560]
-
blk.29.attn_norm.weightF32[2560]
-
blk.29.ffn_down.biasF32[2560]
-
blk.29.ffn_down.weightQ6_K[10240 2560]
-
blk.30.attn_norm.biasF32[2560]
-
blk.30.attn_norm.weightF32[2560]
-
blk.30.ffn_up.biasF32[10240]
-
blk.30.ffn_up.weightQ4_K[2560 10240]
-
blk.30.ffn_down.biasF32[2560]
-
blk.30.ffn_down.weightQ6_K[10240 2560]
-
blk.30.attn_output.biasF32[2560]
-
blk.30.attn_output.weightQ4_K[2560 2560]
-
blk.30.attn_k.biasF32[2560]
-
blk.30.attn_k.weightQ4_K[2560 2560]
-
blk.30.attn_q.biasF32[2560]
-
blk.30.attn_q.weightQ4_K[2560 2560]
-
blk.30.attn_v.biasF32[2560]
-
blk.30.attn_v.weightQ6_K[2560 2560]
-
blk.31.attn_norm.biasF32[2560]
-
blk.31.attn_norm.weightF32[2560]
-
blk.31.ffn_up.biasF32[10240]
-
blk.31.ffn_up.weightQ4_K[2560 10240]
-
blk.31.ffn_down.biasF32[2560]
-
blk.31.ffn_down.weightQ6_K[10240 2560]
-
blk.31.attn_output.biasF32[2560]
-
blk.31.attn_output.weightQ4_K[2560 2560]
-
blk.31.attn_k.biasF32[2560]
-
blk.31.attn_k.weightQ4_K[2560 2560]
-
blk.31.attn_q.biasF32[2560]
-
blk.31.attn_q.weightQ4_K[2560 2560]
-
blk.31.attn_v.biasF32[2560]
-
blk.31.attn_v.weightQ6_K[2560 2560]
-
output.biasF32[58944]
-
output.weightQ6_K[2560 58944]
-
output_norm.biasF32[2560]
-
output_norm.weightF32[2560]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31