128k_q8_0
15GB
128K_Q8_0
14B
121 Pulls Updated 3 months ago
25816d2b932c · 15GB
-
quantize.imatrix.chunks_count234
-
quantize.imatrix.dataset/training_data/calibration_data.txt
-
quantize.imatrix.entries_count160
-
quantize.imatrix.file/models/Phi-3-medium-4k-instruct-GGUF/Phi-3-medium-4k-instruct.imatrix
-
general.architecturephi3
-
general.file_typeQ8_0
-
phi3.attention.head_count40
-
phi3.attention.head_count_kv10
-
phi3.attention.layer_norm_rms_epsilon1e-05
-
phi3.block_count40
-
phi3.context_length4096
-
phi3.embedding_length5120
-
phi3.feed_forward_length17920
-
phi3.rope.dimension_count128
-
phi3.rope.freq_base10000
-
phi3.rope.scaling.original_context_length4096
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32000
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32000
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 0 0 ...]
-
tokenizer.ggml.token_type[3 3 4 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ8_0[5120 32064]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ8_0[17920 5120]
-
blk.0.ffn_up.weightQ8_0[5120 35840]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_output.weightQ8_0[5120 5120]
-
blk.0.attn_qkv.weightQ8_0[5120 7680]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ8_0[17920 5120]
-
blk.1.ffn_up.weightQ8_0[5120 35840]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_output.weightQ8_0[5120 5120]
-
blk.1.attn_qkv.weightQ8_0[5120 7680]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ8_0[17920 5120]
-
blk.2.ffn_up.weightQ8_0[5120 35840]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_output.weightQ8_0[5120 5120]
-
blk.2.attn_qkv.weightQ8_0[5120 7680]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ8_0[17920 5120]
-
blk.3.ffn_up.weightQ8_0[5120 35840]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_output.weightQ8_0[5120 5120]
-
blk.3.attn_qkv.weightQ8_0[5120 7680]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ8_0[17920 5120]
-
blk.4.ffn_up.weightQ8_0[5120 35840]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_output.weightQ8_0[5120 5120]
-
blk.4.attn_qkv.weightQ8_0[5120 7680]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ8_0[17920 5120]
-
blk.5.ffn_up.weightQ8_0[5120 35840]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_output.weightQ8_0[5120 5120]
-
blk.5.attn_qkv.weightQ8_0[5120 7680]
-
blk.6.ffn_up.weightQ8_0[5120 35840]
-
blk.6.attn_output.weightQ8_0[5120 5120]
-
blk.6.attn_qkv.weightQ8_0[5120 7680]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ8_0[17920 5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ8_0[17920 5120]
-
blk.7.ffn_up.weightQ8_0[5120 35840]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_output.weightQ8_0[5120 5120]
-
blk.7.attn_qkv.weightQ8_0[5120 7680]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ8_0[17920 5120]
-
blk.8.ffn_up.weightQ8_0[5120 35840]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_output.weightQ8_0[5120 5120]
-
blk.8.attn_qkv.weightQ8_0[5120 7680]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ8_0[17920 5120]
-
blk.9.ffn_up.weightQ8_0[5120 35840]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_output.weightQ8_0[5120 5120]
-
blk.9.attn_qkv.weightQ8_0[5120 7680]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ8_0[17920 5120]
-
blk.10.ffn_up.weightQ8_0[5120 35840]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_output.weightQ8_0[5120 5120]
-
blk.10.attn_qkv.weightQ8_0[5120 7680]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ8_0[17920 5120]
-
blk.11.ffn_up.weightQ8_0[5120 35840]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_output.weightQ8_0[5120 5120]
-
blk.11.attn_qkv.weightQ8_0[5120 7680]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ8_0[17920 5120]
-
blk.12.ffn_up.weightQ8_0[5120 35840]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_output.weightQ8_0[5120 5120]
-
blk.12.attn_qkv.weightQ8_0[5120 7680]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ8_0[17920 5120]
-
blk.13.ffn_up.weightQ8_0[5120 35840]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_output.weightQ8_0[5120 5120]
-
blk.13.attn_qkv.weightQ8_0[5120 7680]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ8_0[17920 5120]
-
blk.14.ffn_up.weightQ8_0[5120 35840]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_output.weightQ8_0[5120 5120]
-
blk.14.attn_qkv.weightQ8_0[5120 7680]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ8_0[17920 5120]
-
blk.15.ffn_up.weightQ8_0[5120 35840]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_output.weightQ8_0[5120 5120]
-
blk.15.attn_qkv.weightQ8_0[5120 7680]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ8_0[17920 5120]
-
blk.16.ffn_up.weightQ8_0[5120 35840]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_output.weightQ8_0[5120 5120]
-
blk.16.attn_qkv.weightQ8_0[5120 7680]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ8_0[17920 5120]
-
blk.17.ffn_up.weightQ8_0[5120 35840]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_output.weightQ8_0[5120 5120]
-
blk.17.attn_qkv.weightQ8_0[5120 7680]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ8_0[17920 5120]
-
blk.18.ffn_up.weightQ8_0[5120 35840]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_output.weightQ8_0[5120 5120]
-
blk.18.attn_qkv.weightQ8_0[5120 7680]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ8_0[17920 5120]
-
blk.19.ffn_up.weightQ8_0[5120 35840]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_output.weightQ8_0[5120 5120]
-
blk.19.attn_qkv.weightQ8_0[5120 7680]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ8_0[17920 5120]
-
blk.20.ffn_up.weightQ8_0[5120 35840]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_output.weightQ8_0[5120 5120]
-
blk.20.attn_qkv.weightQ8_0[5120 7680]
-
blk.21.attn_output.weightQ8_0[5120 5120]
-
blk.21.attn_qkv.weightQ8_0[5120 7680]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ8_0[17920 5120]
-
blk.21.ffn_up.weightQ8_0[5120 35840]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ8_0[17920 5120]
-
blk.22.ffn_up.weightQ8_0[5120 35840]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_output.weightQ8_0[5120 5120]
-
blk.22.attn_qkv.weightQ8_0[5120 7680]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ8_0[17920 5120]
-
blk.23.ffn_up.weightQ8_0[5120 35840]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_output.weightQ8_0[5120 5120]
-
blk.23.attn_qkv.weightQ8_0[5120 7680]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ8_0[17920 5120]
-
blk.24.ffn_up.weightQ8_0[5120 35840]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_output.weightQ8_0[5120 5120]
-
blk.24.attn_qkv.weightQ8_0[5120 7680]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ8_0[17920 5120]
-
blk.25.ffn_up.weightQ8_0[5120 35840]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_output.weightQ8_0[5120 5120]
-
blk.25.attn_qkv.weightQ8_0[5120 7680]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ8_0[17920 5120]
-
blk.26.ffn_up.weightQ8_0[5120 35840]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_output.weightQ8_0[5120 5120]
-
blk.26.attn_qkv.weightQ8_0[5120 7680]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ8_0[17920 5120]
-
blk.27.ffn_up.weightQ8_0[5120 35840]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_output.weightQ8_0[5120 5120]
-
blk.27.attn_qkv.weightQ8_0[5120 7680]
-
blk.28.attn_output.weightQ8_0[5120 5120]
-
blk.28.attn_qkv.weightQ8_0[5120 7680]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ8_0[17920 5120]
-
blk.28.ffn_up.weightQ8_0[5120 35840]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ8_0[17920 5120]
-
blk.29.ffn_up.weightQ8_0[5120 35840]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_output.weightQ8_0[5120 5120]
-
blk.29.attn_qkv.weightQ8_0[5120 7680]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ8_0[17920 5120]
-
blk.30.ffn_up.weightQ8_0[5120 35840]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_output.weightQ8_0[5120 5120]
-
blk.30.attn_qkv.weightQ8_0[5120 7680]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ8_0[17920 5120]
-
blk.31.ffn_up.weightQ8_0[5120 35840]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_output.weightQ8_0[5120 5120]
-
blk.31.attn_qkv.weightQ8_0[5120 7680]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ8_0[17920 5120]
-
blk.32.ffn_up.weightQ8_0[5120 35840]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_output.weightQ8_0[5120 5120]
-
blk.32.attn_qkv.weightQ8_0[5120 7680]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ8_0[17920 5120]
-
blk.33.ffn_up.weightQ8_0[5120 35840]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_output.weightQ8_0[5120 5120]
-
blk.33.attn_qkv.weightQ8_0[5120 7680]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ8_0[17920 5120]
-
blk.34.ffn_up.weightQ8_0[5120 35840]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_output.weightQ8_0[5120 5120]
-
blk.34.attn_qkv.weightQ8_0[5120 7680]
-
blk.35.attn_output.weightQ8_0[5120 5120]
-
blk.35.attn_qkv.weightQ8_0[5120 7680]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ8_0[17920 5120]
-
blk.35.ffn_up.weightQ8_0[5120 35840]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ8_0[17920 5120]
-
blk.36.ffn_up.weightQ8_0[5120 35840]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_output.weightQ8_0[5120 5120]
-
blk.36.attn_qkv.weightQ8_0[5120 7680]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ8_0[17920 5120]
-
blk.37.ffn_up.weightQ8_0[5120 35840]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_output.weightQ8_0[5120 5120]
-
blk.37.attn_qkv.weightQ8_0[5120 7680]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ8_0[17920 5120]
-
blk.38.ffn_up.weightQ8_0[5120 35840]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_output.weightQ8_0[5120 5120]
-
blk.38.attn_qkv.weightQ8_0[5120 7680]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ8_0[17920 5120]
-
blk.39.ffn_up.weightQ8_0[5120 35840]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_output.weightQ8_0[5120 5120]
-
blk.39.attn_qkv.weightQ8_0[5120 7680]
-
output.weightQ8_0[5120 32064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39