latest
8.6GB
This is a Phi-3 Medium model that has had its prompt-rejection neurons snipped, which is better than fine-tuning because it doesn't otherwise change how the model acts.
14B
5,127 Pulls · Updated 3 months ago
43a0690f64fa · 8.6GB
-
general.architecturephi3
-
general.file_typeQ4_K_M
-
phi3.attention.head_count40
-
phi3.attention.head_count_kv10
-
phi3.attention.layer_norm_rms_epsilon1e-05
-
phi3.block_count40
-
phi3.context_length4096
-
phi3.embedding_length5120
-
phi3.feed_forward_length17920
-
phi3.rope.dimension_count128
-
phi3.rope.freq_base10000
-
phi3.rope.scaling.original_context_length4096
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 4 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_K[5120 32064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ6_K[17920 5120]
-
blk.0.ffn_up.weightQ4_K[5120 35840]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_output.weightQ4_K[5120 5120]
-
blk.0.attn_qkv.weightQ5_K[5120 7680]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ6_K[17920 5120]
-
blk.1.ffn_up.weightQ4_K[5120 35840]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_output.weightQ4_K[5120 5120]
-
blk.1.attn_qkv.weightQ5_K[5120 7680]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ6_K[17920 5120]
-
blk.2.ffn_up.weightQ4_K[5120 35840]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_output.weightQ4_K[5120 5120]
-
blk.2.attn_qkv.weightQ5_K[5120 7680]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ6_K[17920 5120]
-
blk.3.ffn_up.weightQ4_K[5120 35840]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_output.weightQ4_K[5120 5120]
-
blk.3.attn_qkv.weightQ5_K[5120 7680]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ6_K[17920 5120]
-
blk.4.ffn_up.weightQ4_K[5120 35840]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_output.weightQ4_K[5120 5120]
-
blk.4.attn_qkv.weightQ5_K[5120 7680]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ4_K[17920 5120]
-
blk.5.ffn_up.weightQ4_K[5120 35840]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_output.weightQ4_K[5120 5120]
-
blk.5.attn_qkv.weightQ5_K[5120 7680]
-
blk.6.ffn_up.weightQ4_K[5120 35840]
-
blk.6.attn_output.weightQ4_K[5120 5120]
-
blk.6.attn_qkv.weightQ5_K[5120 7680]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ6_K[17920 5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ4_K[17920 5120]
-
blk.7.ffn_up.weightQ4_K[5120 35840]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_output.weightQ4_K[5120 5120]
-
blk.7.attn_qkv.weightQ5_K[5120 7680]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ4_K[17920 5120]
-
blk.8.ffn_up.weightQ4_K[5120 35840]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_output.weightQ4_K[5120 5120]
-
blk.8.attn_qkv.weightQ5_K[5120 7680]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ6_K[17920 5120]
-
blk.9.ffn_up.weightQ4_K[5120 35840]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_output.weightQ4_K[5120 5120]
-
blk.9.attn_qkv.weightQ5_K[5120 7680]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ4_K[17920 5120]
-
blk.10.ffn_up.weightQ4_K[5120 35840]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_output.weightQ4_K[5120 5120]
-
blk.10.attn_qkv.weightQ5_K[5120 7680]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ6_K[17920 5120]
-
blk.11.ffn_up.weightQ4_K[5120 35840]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_output.weightQ4_K[5120 5120]
-
blk.11.attn_qkv.weightQ5_K[5120 7680]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ4_K[17920 5120]
-
blk.12.ffn_up.weightQ4_K[5120 35840]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_output.weightQ4_K[5120 5120]
-
blk.12.attn_qkv.weightQ5_K[5120 7680]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ4_K[17920 5120]
-
blk.13.ffn_up.weightQ4_K[5120 35840]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_output.weightQ4_K[5120 5120]
-
blk.13.attn_qkv.weightQ5_K[5120 7680]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ4_K[17920 5120]
-
blk.14.ffn_up.weightQ4_K[5120 35840]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_output.weightQ4_K[5120 5120]
-
blk.14.attn_qkv.weightQ5_K[5120 7680]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ4_K[17920 5120]
-
blk.15.ffn_up.weightQ4_K[5120 35840]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ4_K[5120 5120]
-
blk.15.attn_qkv.weightQ5_K[5120 7680]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ6_K[17920 5120]
-
blk.16.ffn_up.weightQ4_K[5120 35840]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_output.weightQ4_K[5120 5120]
-
blk.16.attn_qkv.weightQ5_K[5120 7680]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ4_K[17920 5120]
-
blk.17.ffn_up.weightQ4_K[5120 35840]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_output.weightQ4_K[5120 5120]
-
blk.17.attn_qkv.weightQ5_K[5120 7680]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ4_K[17920 5120]
-
blk.18.ffn_up.weightQ4_K[5120 35840]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_output.weightQ4_K[5120 5120]
-
blk.18.attn_qkv.weightQ5_K[5120 7680]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ6_K[17920 5120]
-
blk.19.ffn_up.weightQ4_K[5120 35840]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_output.weightQ4_K[5120 5120]
-
blk.19.attn_qkv.weightQ5_K[5120 7680]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ4_K[17920 5120]
-
blk.20.ffn_up.weightQ4_K[5120 35840]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_output.weightQ4_K[5120 5120]
-
blk.20.attn_qkv.weightQ5_K[5120 7680]
-
blk.21.attn_output.weightQ4_K[5120 5120]
-
blk.21.attn_qkv.weightQ5_K[5120 7680]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ4_K[17920 5120]
-
blk.21.ffn_up.weightQ4_K[5120 35840]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ6_K[17920 5120]
-
blk.22.ffn_up.weightQ4_K[5120 35840]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_output.weightQ4_K[5120 5120]
-
blk.22.attn_qkv.weightQ5_K[5120 7680]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ4_K[17920 5120]
-
blk.23.ffn_up.weightQ4_K[5120 35840]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_output.weightQ4_K[5120 5120]
-
blk.23.attn_qkv.weightQ5_K[5120 7680]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ4_K[17920 5120]
-
blk.24.ffn_up.weightQ4_K[5120 35840]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_output.weightQ4_K[5120 5120]
-
blk.24.attn_qkv.weightQ5_K[5120 7680]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ6_K[17920 5120]
-
blk.25.ffn_up.weightQ4_K[5120 35840]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_output.weightQ4_K[5120 5120]
-
blk.25.attn_qkv.weightQ5_K[5120 7680]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ4_K[17920 5120]
-
blk.26.ffn_up.weightQ4_K[5120 35840]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_output.weightQ4_K[5120 5120]
-
blk.26.attn_qkv.weightQ5_K[5120 7680]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ4_K[17920 5120]
-
blk.27.ffn_up.weightQ4_K[5120 35840]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_output.weightQ4_K[5120 5120]
-
blk.27.attn_qkv.weightQ5_K[5120 7680]
-
blk.28.attn_output.weightQ4_K[5120 5120]
-
blk.28.attn_qkv.weightQ5_K[5120 7680]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ6_K[17920 5120]
-
blk.28.ffn_up.weightQ4_K[5120 35840]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ4_K[17920 5120]
-
blk.29.ffn_up.weightQ4_K[5120 35840]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_output.weightQ4_K[5120 5120]
-
blk.29.attn_qkv.weightQ5_K[5120 7680]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ4_K[17920 5120]
-
blk.30.ffn_up.weightQ4_K[5120 35840]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_output.weightQ4_K[5120 5120]
-
blk.30.attn_qkv.weightQ5_K[5120 7680]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ6_K[17920 5120]
-
blk.31.ffn_up.weightQ4_K[5120 35840]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_output.weightQ4_K[5120 5120]
-
blk.31.attn_qkv.weightQ5_K[5120 7680]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ4_K[17920 5120]
-
blk.32.ffn_up.weightQ4_K[5120 35840]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_output.weightQ4_K[5120 5120]
-
blk.32.attn_qkv.weightQ5_K[5120 7680]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ4_K[17920 5120]
-
blk.33.ffn_up.weightQ4_K[5120 35840]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_output.weightQ4_K[5120 5120]
-
blk.33.attn_qkv.weightQ5_K[5120 7680]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ6_K[17920 5120]
-
blk.34.ffn_up.weightQ4_K[5120 35840]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_output.weightQ4_K[5120 5120]
-
blk.34.attn_qkv.weightQ5_K[5120 7680]
-
blk.35.attn_output.weightQ4_K[5120 5120]
-
blk.35.attn_qkv.weightQ5_K[5120 7680]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ6_K[17920 5120]
-
blk.35.ffn_up.weightQ4_K[5120 35840]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ6_K[17920 5120]
-
blk.36.ffn_up.weightQ4_K[5120 35840]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_output.weightQ4_K[5120 5120]
-
blk.36.attn_qkv.weightQ5_K[5120 7680]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ6_K[17920 5120]
-
blk.37.ffn_up.weightQ4_K[5120 35840]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_output.weightQ4_K[5120 5120]
-
blk.37.attn_qkv.weightQ5_K[5120 7680]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ6_K[17920 5120]
-
blk.38.ffn_up.weightQ4_K[5120 35840]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_output.weightQ4_K[5120 5120]
-
blk.38.attn_qkv.weightQ5_K[5120 7680]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ6_K[17920 5120]
-
blk.39.ffn_up.weightQ4_K[5120 35840]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_output.weightQ4_K[5120 5120]
-
blk.39.attn_qkv.weightQ5_K[5120 7680]
-
output.weightQ6_K[5120 32064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39