latest
28GB
Microsoft’s Phi 3 Medium 4K Instruct
14B
64 Pulls Updated 3 months ago
893a6517f6d6 · 10GB
-
general.architecturephi3
-
general.file_typeQ5_K_M
-
phi3.attention.head_count40
-
phi3.attention.head_count_kv10
-
phi3.attention.layer_norm_rms_epsilon1e-05
-
phi3.block_count40
-
phi3.context_length4096
-
phi3.embedding_length5120
-
phi3.feed_forward_length17920
-
phi3.rope.dimension_count128
-
phi3.rope.freq_base10000
-
phi3.rope.scaling.original_context_length4096
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 4 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ5_K[5120 32064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ6_K[17920 5120]
-
blk.0.ffn_up.weightQ5_K[5120 35840]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_output.weightQ5_K[5120 5120]
-
blk.0.attn_qkv.weightQ6_K[5120 7680]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ6_K[17920 5120]
-
blk.1.ffn_up.weightQ5_K[5120 35840]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_output.weightQ5_K[5120 5120]
-
blk.1.attn_qkv.weightQ6_K[5120 7680]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ6_K[17920 5120]
-
blk.2.ffn_up.weightQ5_K[5120 35840]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_output.weightQ5_K[5120 5120]
-
blk.2.attn_qkv.weightQ6_K[5120 7680]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ6_K[17920 5120]
-
blk.3.ffn_up.weightQ5_K[5120 35840]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_output.weightQ5_K[5120 5120]
-
blk.3.attn_qkv.weightQ6_K[5120 7680]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ6_K[17920 5120]
-
blk.4.ffn_up.weightQ5_K[5120 35840]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_output.weightQ5_K[5120 5120]
-
blk.4.attn_qkv.weightQ6_K[5120 7680]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ5_K[17920 5120]
-
blk.5.ffn_up.weightQ5_K[5120 35840]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_output.weightQ5_K[5120 5120]
-
blk.5.attn_qkv.weightQ6_K[5120 7680]
-
blk.6.ffn_up.weightQ5_K[5120 35840]
-
blk.6.attn_output.weightQ5_K[5120 5120]
-
blk.6.attn_qkv.weightQ6_K[5120 7680]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ6_K[17920 5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ5_K[17920 5120]
-
blk.7.ffn_up.weightQ5_K[5120 35840]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_output.weightQ5_K[5120 5120]
-
blk.7.attn_qkv.weightQ6_K[5120 7680]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ5_K[17920 5120]
-
blk.8.ffn_up.weightQ5_K[5120 35840]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_output.weightQ5_K[5120 5120]
-
blk.8.attn_qkv.weightQ6_K[5120 7680]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ6_K[17920 5120]
-
blk.9.ffn_up.weightQ5_K[5120 35840]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_output.weightQ5_K[5120 5120]
-
blk.9.attn_qkv.weightQ6_K[5120 7680]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ5_K[17920 5120]
-
blk.10.ffn_up.weightQ5_K[5120 35840]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_output.weightQ5_K[5120 5120]
-
blk.10.attn_qkv.weightQ6_K[5120 7680]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ6_K[17920 5120]
-
blk.11.ffn_up.weightQ5_K[5120 35840]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_output.weightQ5_K[5120 5120]
-
blk.11.attn_qkv.weightQ6_K[5120 7680]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ5_K[17920 5120]
-
blk.12.ffn_up.weightQ5_K[5120 35840]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_output.weightQ5_K[5120 5120]
-
blk.12.attn_qkv.weightQ6_K[5120 7680]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ5_K[17920 5120]
-
blk.13.ffn_up.weightQ5_K[5120 35840]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_output.weightQ5_K[5120 5120]
-
blk.13.attn_qkv.weightQ6_K[5120 7680]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ5_K[17920 5120]
-
blk.14.ffn_up.weightQ5_K[5120 35840]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_output.weightQ5_K[5120 5120]
-
blk.14.attn_qkv.weightQ6_K[5120 7680]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ5_K[17920 5120]
-
blk.15.ffn_up.weightQ5_K[5120 35840]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ5_K[5120 5120]
-
blk.15.attn_qkv.weightQ6_K[5120 7680]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ6_K[17920 5120]
-
blk.16.ffn_up.weightQ5_K[5120 35840]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_output.weightQ5_K[5120 5120]
-
blk.16.attn_qkv.weightQ6_K[5120 7680]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ5_K[17920 5120]
-
blk.17.ffn_up.weightQ5_K[5120 35840]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_output.weightQ5_K[5120 5120]
-
blk.17.attn_qkv.weightQ6_K[5120 7680]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ5_K[17920 5120]
-
blk.18.ffn_up.weightQ5_K[5120 35840]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_output.weightQ5_K[5120 5120]
-
blk.18.attn_qkv.weightQ6_K[5120 7680]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ6_K[17920 5120]
-
blk.19.ffn_up.weightQ5_K[5120 35840]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_output.weightQ5_K[5120 5120]
-
blk.19.attn_qkv.weightQ6_K[5120 7680]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ5_K[17920 5120]
-
blk.20.ffn_up.weightQ5_K[5120 35840]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_output.weightQ5_K[5120 5120]
-
blk.20.attn_qkv.weightQ6_K[5120 7680]
-
blk.21.attn_output.weightQ5_K[5120 5120]
-
blk.21.attn_qkv.weightQ6_K[5120 7680]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ5_K[17920 5120]
-
blk.21.ffn_up.weightQ5_K[5120 35840]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ6_K[17920 5120]
-
blk.22.ffn_up.weightQ5_K[5120 35840]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_output.weightQ5_K[5120 5120]
-
blk.22.attn_qkv.weightQ6_K[5120 7680]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ5_K[17920 5120]
-
blk.23.ffn_up.weightQ5_K[5120 35840]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_output.weightQ5_K[5120 5120]
-
blk.23.attn_qkv.weightQ6_K[5120 7680]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ5_K[17920 5120]
-
blk.24.ffn_up.weightQ5_K[5120 35840]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_output.weightQ5_K[5120 5120]
-
blk.24.attn_qkv.weightQ6_K[5120 7680]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ6_K[17920 5120]
-
blk.25.ffn_up.weightQ5_K[5120 35840]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_output.weightQ5_K[5120 5120]
-
blk.25.attn_qkv.weightQ6_K[5120 7680]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ5_K[17920 5120]
-
blk.26.ffn_up.weightQ5_K[5120 35840]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_output.weightQ5_K[5120 5120]
-
blk.26.attn_qkv.weightQ6_K[5120 7680]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ5_K[17920 5120]
-
blk.27.ffn_up.weightQ5_K[5120 35840]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_output.weightQ5_K[5120 5120]
-
blk.27.attn_qkv.weightQ6_K[5120 7680]
-
blk.28.attn_output.weightQ5_K[5120 5120]
-
blk.28.attn_qkv.weightQ6_K[5120 7680]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ6_K[17920 5120]
-
blk.28.ffn_up.weightQ5_K[5120 35840]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ5_K[17920 5120]
-
blk.29.ffn_up.weightQ5_K[5120 35840]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_output.weightQ5_K[5120 5120]
-
blk.29.attn_qkv.weightQ6_K[5120 7680]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ5_K[17920 5120]
-
blk.30.ffn_up.weightQ5_K[5120 35840]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_output.weightQ5_K[5120 5120]
-
blk.30.attn_qkv.weightQ6_K[5120 7680]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ6_K[17920 5120]
-
blk.31.ffn_up.weightQ5_K[5120 35840]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_output.weightQ5_K[5120 5120]
-
blk.31.attn_qkv.weightQ6_K[5120 7680]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ5_K[17920 5120]
-
blk.32.ffn_up.weightQ5_K[5120 35840]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_output.weightQ5_K[5120 5120]
-
blk.32.attn_qkv.weightQ6_K[5120 7680]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ5_K[17920 5120]
-
blk.33.ffn_up.weightQ5_K[5120 35840]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_output.weightQ5_K[5120 5120]
-
blk.33.attn_qkv.weightQ6_K[5120 7680]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ6_K[17920 5120]
-
blk.34.ffn_up.weightQ5_K[5120 35840]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_output.weightQ5_K[5120 5120]
-
blk.34.attn_qkv.weightQ6_K[5120 7680]
-
blk.35.attn_output.weightQ5_K[5120 5120]
-
blk.35.attn_qkv.weightQ6_K[5120 7680]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ6_K[17920 5120]
-
blk.35.ffn_up.weightQ5_K[5120 35840]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ6_K[17920 5120]
-
blk.36.ffn_up.weightQ5_K[5120 35840]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_output.weightQ5_K[5120 5120]
-
blk.36.attn_qkv.weightQ6_K[5120 7680]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ6_K[17920 5120]
-
blk.37.ffn_up.weightQ5_K[5120 35840]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_output.weightQ5_K[5120 5120]
-
blk.37.attn_qkv.weightQ6_K[5120 7680]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ6_K[17920 5120]
-
blk.38.ffn_up.weightQ5_K[5120 35840]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_output.weightQ5_K[5120 5120]
-
blk.38.attn_qkv.weightQ6_K[5120 7680]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ6_K[17920 5120]
-
blk.39.ffn_up.weightQ5_K[5120 35840]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_output.weightQ5_K[5120 5120]
-
blk.39.attn_qkv.weightQ6_K[5120 7680]
-
output.weightQ6_K[5120 32064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39