bartowski/Phi-3-medium-128k-instruct-GGUF
14B
175 Pulls Updated 4 months ago
a0da98dc6e5f · 9.6GB
-
quantize.imatrix.chunks_count234
-
quantize.imatrix.dataset/training_data/calibration_data.txt
-
quantize.imatrix.entries_count160
-
quantize.imatrix.file/models/Phi-3-medium-128k-instruct-GGUF/Phi-3-medium-128k-instruct.imatrix
-
general.architecturephi3
-
general.file_typeQ5_K_S
-
phi3.attention.head_count40
-
phi3.attention.head_count_kv10
-
phi3.attention.layer_norm_rms_epsilon1e-05
-
phi3.block_count40
-
phi3.context_length131072
-
phi3.embedding_length5120
-
phi3.feed_forward_length17920
-
phi3.rope.dimension_count128
-
phi3.rope.freq_base10000
-
phi3.rope.scaling.attn_factor1.1902381
-
phi3.rope.scaling.original_context_length4096
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 4 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ5_K[5120 32064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ5_K[17920 5120]
-
blk.0.ffn_up.weightQ5_K[5120 35840]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_output.weightQ5_K[5120 5120]
-
blk.0.attn_qkv.weightQ5_K[5120 7680]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ5_K[17920 5120]
-
blk.1.ffn_up.weightQ5_K[5120 35840]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_output.weightQ5_K[5120 5120]
-
blk.1.attn_qkv.weightQ5_K[5120 7680]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ5_K[17920 5120]
-
blk.2.ffn_up.weightQ5_K[5120 35840]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_output.weightQ5_K[5120 5120]
-
blk.2.attn_qkv.weightQ5_K[5120 7680]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ5_K[17920 5120]
-
blk.3.ffn_up.weightQ5_K[5120 35840]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_output.weightQ5_K[5120 5120]
-
blk.3.attn_qkv.weightQ5_K[5120 7680]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ5_K[17920 5120]
-
blk.4.ffn_up.weightQ5_K[5120 35840]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_output.weightQ5_K[5120 5120]
-
blk.4.attn_qkv.weightQ5_K[5120 7680]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ5_K[17920 5120]
-
blk.5.ffn_up.weightQ5_K[5120 35840]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_output.weightQ5_K[5120 5120]
-
blk.5.attn_qkv.weightQ5_K[5120 7680]
-
blk.6.ffn_up.weightQ5_K[5120 35840]
-
blk.6.attn_output.weightQ5_K[5120 5120]
-
blk.6.attn_qkv.weightQ5_K[5120 7680]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ5_K[17920 5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ5_K[17920 5120]
-
blk.7.ffn_up.weightQ5_K[5120 35840]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_output.weightQ5_K[5120 5120]
-
blk.7.attn_qkv.weightQ5_K[5120 7680]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ5_K[17920 5120]
-
blk.8.ffn_up.weightQ5_K[5120 35840]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_output.weightQ5_K[5120 5120]
-
blk.8.attn_qkv.weightQ5_K[5120 7680]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ5_K[17920 5120]
-
blk.9.ffn_up.weightQ5_K[5120 35840]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_output.weightQ5_K[5120 5120]
-
blk.9.attn_qkv.weightQ5_K[5120 7680]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ5_K[17920 5120]
-
blk.10.ffn_up.weightQ5_K[5120 35840]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_output.weightQ5_K[5120 5120]
-
blk.10.attn_qkv.weightQ5_K[5120 7680]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ5_K[17920 5120]
-
blk.11.ffn_up.weightQ5_K[5120 35840]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_output.weightQ5_K[5120 5120]
-
blk.11.attn_qkv.weightQ5_K[5120 7680]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ5_K[17920 5120]
-
blk.12.ffn_up.weightQ5_K[5120 35840]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_output.weightQ5_K[5120 5120]
-
blk.12.attn_qkv.weightQ5_K[5120 7680]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ5_K[17920 5120]
-
blk.13.ffn_up.weightQ5_K[5120 35840]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_output.weightQ5_K[5120 5120]
-
blk.13.attn_qkv.weightQ5_K[5120 7680]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ5_K[17920 5120]
-
blk.14.ffn_up.weightQ5_K[5120 35840]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_output.weightQ5_K[5120 5120]
-
blk.14.attn_qkv.weightQ5_K[5120 7680]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ5_K[17920 5120]
-
blk.15.ffn_up.weightQ5_K[5120 35840]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ5_K[5120 5120]
-
blk.15.attn_qkv.weightQ5_K[5120 7680]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ5_K[17920 5120]
-
blk.16.ffn_up.weightQ5_K[5120 35840]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_output.weightQ5_K[5120 5120]
-
blk.16.attn_qkv.weightQ5_K[5120 7680]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ5_K[17920 5120]
-
blk.17.ffn_up.weightQ5_K[5120 35840]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_output.weightQ5_K[5120 5120]
-
blk.17.attn_qkv.weightQ5_K[5120 7680]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ5_K[17920 5120]
-
blk.18.ffn_up.weightQ5_K[5120 35840]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_output.weightQ5_K[5120 5120]
-
blk.18.attn_qkv.weightQ5_K[5120 7680]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ5_K[17920 5120]
-
blk.19.ffn_up.weightQ5_K[5120 35840]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_output.weightQ5_K[5120 5120]
-
blk.19.attn_qkv.weightQ5_K[5120 7680]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ5_K[17920 5120]
-
blk.20.ffn_up.weightQ5_K[5120 35840]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_output.weightQ5_K[5120 5120]
-
blk.20.attn_qkv.weightQ5_K[5120 7680]
-
blk.21.attn_output.weightQ5_K[5120 5120]
-
blk.21.attn_qkv.weightQ5_K[5120 7680]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ5_K[17920 5120]
-
blk.21.ffn_up.weightQ5_K[5120 35840]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ5_K[17920 5120]
-
blk.22.ffn_up.weightQ5_K[5120 35840]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_output.weightQ5_K[5120 5120]
-
blk.22.attn_qkv.weightQ5_K[5120 7680]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ5_K[17920 5120]
-
blk.23.ffn_up.weightQ5_K[5120 35840]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_output.weightQ5_K[5120 5120]
-
blk.23.attn_qkv.weightQ5_K[5120 7680]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ5_K[17920 5120]
-
blk.24.ffn_up.weightQ5_K[5120 35840]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_output.weightQ5_K[5120 5120]
-
blk.24.attn_qkv.weightQ5_K[5120 7680]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ5_K[17920 5120]
-
blk.25.ffn_up.weightQ5_K[5120 35840]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_output.weightQ5_K[5120 5120]
-
blk.25.attn_qkv.weightQ5_K[5120 7680]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ5_K[17920 5120]
-
blk.26.ffn_up.weightQ5_K[5120 35840]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_output.weightQ5_K[5120 5120]
-
blk.26.attn_qkv.weightQ5_K[5120 7680]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ5_K[17920 5120]
-
blk.27.ffn_up.weightQ5_K[5120 35840]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_output.weightQ5_K[5120 5120]
-
blk.27.attn_qkv.weightQ5_K[5120 7680]
-
blk.28.attn_output.weightQ5_K[5120 5120]
-
blk.28.attn_qkv.weightQ5_K[5120 7680]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ5_K[17920 5120]
-
blk.28.ffn_up.weightQ5_K[5120 35840]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ5_K[17920 5120]
-
blk.29.ffn_up.weightQ5_K[5120 35840]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_output.weightQ5_K[5120 5120]
-
blk.29.attn_qkv.weightQ5_K[5120 7680]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ5_K[17920 5120]
-
blk.30.ffn_up.weightQ5_K[5120 35840]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_output.weightQ5_K[5120 5120]
-
blk.30.attn_qkv.weightQ5_K[5120 7680]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ5_K[17920 5120]
-
blk.31.ffn_up.weightQ5_K[5120 35840]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_output.weightQ5_K[5120 5120]
-
blk.31.attn_qkv.weightQ5_K[5120 7680]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ5_K[17920 5120]
-
blk.32.ffn_up.weightQ5_K[5120 35840]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_output.weightQ5_K[5120 5120]
-
blk.32.attn_qkv.weightQ5_K[5120 7680]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ5_K[17920 5120]
-
blk.33.ffn_up.weightQ5_K[5120 35840]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_output.weightQ5_K[5120 5120]
-
blk.33.attn_qkv.weightQ5_K[5120 7680]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ5_K[17920 5120]
-
blk.34.ffn_up.weightQ5_K[5120 35840]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_output.weightQ5_K[5120 5120]
-
blk.34.attn_qkv.weightQ5_K[5120 7680]
-
blk.35.attn_output.weightQ5_K[5120 5120]
-
blk.35.attn_qkv.weightQ5_K[5120 7680]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ5_K[17920 5120]
-
blk.35.ffn_up.weightQ5_K[5120 35840]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ5_K[17920 5120]
-
blk.36.ffn_up.weightQ5_K[5120 35840]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_output.weightQ5_K[5120 5120]
-
blk.36.attn_qkv.weightQ5_K[5120 7680]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ5_K[17920 5120]
-
blk.37.ffn_up.weightQ5_K[5120 35840]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_output.weightQ5_K[5120 5120]
-
blk.37.attn_qkv.weightQ5_K[5120 7680]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ5_K[17920 5120]
-
blk.38.ffn_up.weightQ5_K[5120 35840]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_output.weightQ5_K[5120 5120]
-
blk.38.attn_qkv.weightQ5_K[5120 7680]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ5_K[17920 5120]
-
blk.39.ffn_up.weightQ5_K[5120 35840]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_output.weightQ5_K[5120 5120]
-
blk.39.attn_qkv.weightQ5_K[5120 7680]
-
output.weightQ6_K[5120 32064]
-
output_norm.weightF32[5120]
-
rope_factors_long.weightF32[64]
-
rope_factors_short.weightF32[64]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39