latest
5.7GB
适配轻小说/Galgame的日中翻译大模型
467 Pulls Updated 6 months ago
d15e8b6954f6 · 5.7GB
-
general.architectureqwen
-
general.file_typeQ2_K_S
-
qwen.attention.head_count40
-
qwen.attention.layer_norm_rms_epsilon1e-06
-
qwen.block_count40
-
qwen.context_length8192
-
qwen.embedding_length5120
-
qwen.feed_forward_length27392
-
qwen.rope.dimension_count128
-
qwen.rope.freq_base10000
-
tokenizer.ggml.bos_token_id151644
-
tokenizer.ggml.eos_token_id151645
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ i n Ġ t ĠĠĠĠ ĠĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.token_type[1 1 1 1 1 ...]
-
tokenizer.ggml.tokens[! " # $ % ...]
-
tokenizer.ggml.unknown_token_id151643
-
NameTypeShape
-
token_embd.weightQ2_K[5120 152064]
-
blk.0.attn_qkv.biasF32[15360]
-
blk.0.attn_qkv.weightQ2_K[5120 15360]
-
blk.0.attn_output.weightQ2_K[5120 5120]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ5_0[13696 5120]
-
blk.0.ffn_up.weightQ2_K[5120 13696]
-
blk.0.ffn_gate.weightQ2_K[5120 13696]
-
blk.1.attn_qkv.biasF32[15360]
-
blk.1.attn_qkv.weightQ2_K[5120 15360]
-
blk.1.attn_output.weightQ2_K[5120 5120]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ5_0[13696 5120]
-
blk.1.ffn_up.weightQ2_K[5120 13696]
-
blk.1.ffn_gate.weightQ2_K[5120 13696]
-
blk.2.attn_qkv.biasF32[15360]
-
blk.2.attn_qkv.weightQ2_K[5120 15360]
-
blk.2.attn_output.weightQ2_K[5120 5120]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ4_0[13696 5120]
-
blk.2.ffn_up.weightQ2_K[5120 13696]
-
blk.2.ffn_gate.weightQ2_K[5120 13696]
-
blk.3.attn_qkv.biasF32[15360]
-
blk.3.attn_qkv.weightQ2_K[5120 15360]
-
blk.3.attn_output.weightQ2_K[5120 5120]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ4_0[13696 5120]
-
blk.3.ffn_up.weightQ2_K[5120 13696]
-
blk.3.ffn_gate.weightQ2_K[5120 13696]
-
blk.4.attn_qkv.biasF32[15360]
-
blk.4.attn_qkv.weightQ2_K[5120 15360]
-
blk.4.attn_output.weightQ2_K[5120 5120]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ4_0[13696 5120]
-
blk.4.ffn_up.weightQ2_K[5120 13696]
-
blk.4.ffn_gate.weightQ2_K[5120 13696]
-
blk.5.attn_qkv.biasF32[15360]
-
blk.5.attn_qkv.weightQ2_K[5120 15360]
-
blk.5.attn_output.weightQ2_K[5120 5120]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ4_0[13696 5120]
-
blk.5.ffn_up.weightQ2_K[5120 13696]
-
blk.5.ffn_gate.weightQ2_K[5120 13696]
-
blk.6.attn_qkv.biasF32[15360]
-
blk.6.attn_qkv.weightQ2_K[5120 15360]
-
blk.6.attn_output.weightQ2_K[5120 5120]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ4_0[13696 5120]
-
blk.6.ffn_up.weightQ2_K[5120 13696]
-
blk.6.ffn_gate.weightQ2_K[5120 13696]
-
blk.7.attn_qkv.biasF32[15360]
-
blk.7.attn_qkv.weightQ2_K[5120 15360]
-
blk.7.attn_output.weightQ2_K[5120 5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ4_0[13696 5120]
-
blk.7.ffn_up.weightQ2_K[5120 13696]
-
blk.7.ffn_gate.weightQ2_K[5120 13696]
-
blk.8.attn_qkv.biasF32[15360]
-
blk.8.attn_qkv.weightQ2_K[5120 15360]
-
blk.8.attn_output.weightQ2_K[5120 5120]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ4_0[13696 5120]
-
blk.8.ffn_up.weightQ2_K[5120 13696]
-
blk.8.ffn_gate.weightQ2_K[5120 13696]
-
blk.9.attn_qkv.biasF32[15360]
-
blk.9.attn_qkv.weightQ2_K[5120 15360]
-
blk.9.attn_output.weightQ2_K[5120 5120]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ4_0[13696 5120]
-
blk.9.ffn_up.weightQ2_K[5120 13696]
-
blk.9.ffn_gate.weightQ2_K[5120 13696]
-
blk.10.attn_qkv.biasF32[15360]
-
blk.10.attn_qkv.weightQ2_K[5120 15360]
-
blk.10.attn_output.weightQ2_K[5120 5120]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ5_0[13696 5120]
-
blk.10.ffn_up.weightQ2_K[5120 13696]
-
blk.10.ffn_gate.weightQ2_K[5120 13696]
-
blk.11.attn_qkv.biasF32[15360]
-
blk.11.attn_qkv.weightQ2_K[5120 15360]
-
blk.11.attn_output.weightQ2_K[5120 5120]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ5_0[13696 5120]
-
blk.11.ffn_up.weightQ2_K[5120 13696]
-
blk.11.ffn_gate.weightQ2_K[5120 13696]
-
blk.12.attn_qkv.biasF32[15360]
-
blk.12.attn_qkv.weightQ2_K[5120 15360]
-
blk.12.attn_output.weightQ2_K[5120 5120]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ5_0[13696 5120]
-
blk.12.ffn_up.weightQ2_K[5120 13696]
-
blk.12.ffn_gate.weightQ2_K[5120 13696]
-
blk.13.attn_qkv.biasF32[15360]
-
blk.13.attn_qkv.weightQ2_K[5120 15360]
-
blk.13.attn_output.weightQ2_K[5120 5120]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ4_0[13696 5120]
-
blk.13.ffn_up.weightQ2_K[5120 13696]
-
blk.13.ffn_gate.weightQ2_K[5120 13696]
-
blk.14.attn_qkv.biasF32[15360]
-
blk.14.attn_qkv.weightQ2_K[5120 15360]
-
blk.14.attn_output.weightQ2_K[5120 5120]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ4_0[13696 5120]
-
blk.14.ffn_up.weightQ2_K[5120 13696]
-
blk.14.ffn_gate.weightQ2_K[5120 13696]
-
blk.15.attn_qkv.biasF32[15360]
-
blk.15.attn_qkv.weightQ2_K[5120 15360]
-
blk.15.attn_output.weightQ2_K[5120 5120]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ4_0[13696 5120]
-
blk.15.ffn_up.weightQ2_K[5120 13696]
-
blk.15.ffn_gate.weightQ2_K[5120 13696]
-
blk.16.attn_qkv.biasF32[15360]
-
blk.16.attn_qkv.weightQ2_K[5120 15360]
-
blk.16.attn_output.weightQ2_K[5120 5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ4_0[13696 5120]
-
blk.16.ffn_up.weightQ2_K[5120 13696]
-
blk.16.ffn_gate.weightQ2_K[5120 13696]
-
blk.17.attn_qkv.biasF32[15360]
-
blk.17.attn_qkv.weightQ2_K[5120 15360]
-
blk.17.attn_output.weightQ2_K[5120 5120]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ4_0[13696 5120]
-
blk.17.ffn_up.weightQ2_K[5120 13696]
-
blk.17.ffn_gate.weightQ2_K[5120 13696]
-
blk.18.attn_qkv.biasF32[15360]
-
blk.18.attn_qkv.weightQ2_K[5120 15360]
-
blk.18.attn_output.weightQ2_K[5120 5120]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ4_0[13696 5120]
-
blk.18.ffn_up.weightQ2_K[5120 13696]
-
blk.18.ffn_gate.weightQ2_K[5120 13696]
-
blk.19.attn_qkv.biasF32[15360]
-
blk.19.attn_qkv.weightQ2_K[5120 15360]
-
blk.19.attn_output.weightQ2_K[5120 5120]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ4_0[13696 5120]
-
blk.19.ffn_up.weightQ2_K[5120 13696]
-
blk.19.ffn_gate.weightQ2_K[5120 13696]
-
blk.20.attn_qkv.biasF32[15360]
-
blk.20.attn_qkv.weightQ2_K[5120 15360]
-
blk.20.attn_output.weightQ2_K[5120 5120]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ4_0[13696 5120]
-
blk.20.ffn_up.weightQ2_K[5120 13696]
-
blk.20.ffn_gate.weightQ2_K[5120 13696]
-
blk.21.attn_qkv.biasF32[15360]
-
blk.21.attn_qkv.weightQ2_K[5120 15360]
-
blk.21.attn_output.weightQ2_K[5120 5120]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ4_0[13696 5120]
-
blk.21.ffn_up.weightQ2_K[5120 13696]
-
blk.21.ffn_gate.weightQ2_K[5120 13696]
-
blk.22.attn_qkv.biasF32[15360]
-
blk.22.attn_qkv.weightQ2_K[5120 15360]
-
blk.22.attn_output.weightQ2_K[5120 5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ4_0[13696 5120]
-
blk.22.ffn_up.weightQ2_K[5120 13696]
-
blk.22.ffn_gate.weightQ2_K[5120 13696]
-
blk.23.attn_qkv.biasF32[15360]
-
blk.23.attn_qkv.weightQ2_K[5120 15360]
-
blk.23.attn_output.weightQ2_K[5120 5120]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ4_0[13696 5120]
-
blk.23.ffn_up.weightQ2_K[5120 13696]
-
blk.23.ffn_gate.weightQ2_K[5120 13696]
-
blk.24.attn_qkv.biasF32[15360]
-
blk.24.attn_qkv.weightQ2_K[5120 15360]
-
blk.24.attn_output.weightQ2_K[5120 5120]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ4_0[13696 5120]
-
blk.24.ffn_up.weightQ2_K[5120 13696]
-
blk.24.ffn_gate.weightQ2_K[5120 13696]
-
blk.25.attn_qkv.biasF32[15360]
-
blk.25.attn_qkv.weightQ2_K[5120 15360]
-
blk.25.attn_output.weightQ2_K[5120 5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ4_0[13696 5120]
-
blk.25.ffn_up.weightQ2_K[5120 13696]
-
blk.25.ffn_gate.weightQ2_K[5120 13696]
-
blk.26.attn_qkv.biasF32[15360]
-
blk.26.attn_qkv.weightQ2_K[5120 15360]
-
blk.26.attn_output.weightQ2_K[5120 5120]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ4_0[13696 5120]
-
blk.26.ffn_up.weightQ2_K[5120 13696]
-
blk.26.ffn_gate.weightQ2_K[5120 13696]
-
blk.27.attn_qkv.biasF32[15360]
-
blk.27.attn_qkv.weightQ2_K[5120 15360]
-
blk.27.attn_output.weightQ2_K[5120 5120]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ4_0[13696 5120]
-
blk.27.ffn_up.weightQ2_K[5120 13696]
-
blk.27.ffn_gate.weightQ2_K[5120 13696]
-
blk.28.attn_qkv.biasF32[15360]
-
blk.28.attn_qkv.weightQ2_K[5120 15360]
-
blk.28.attn_output.weightQ2_K[5120 5120]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ4_0[13696 5120]
-
blk.28.ffn_up.weightQ2_K[5120 13696]
-
blk.28.ffn_gate.weightQ2_K[5120 13696]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.attn_qkv.biasF32[15360]
-
blk.29.attn_qkv.weightQ2_K[5120 15360]
-
blk.29.attn_output.weightQ2_K[5120 5120]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ4_0[13696 5120]
-
blk.29.ffn_up.weightQ2_K[5120 13696]
-
blk.29.ffn_gate.weightQ2_K[5120 13696]
-
blk.30.attn_qkv.biasF32[15360]
-
blk.30.attn_qkv.weightQ2_K[5120 15360]
-
blk.30.attn_output.weightQ2_K[5120 5120]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ4_0[13696 5120]
-
blk.30.ffn_up.weightQ2_K[5120 13696]
-
blk.30.ffn_gate.weightQ2_K[5120 13696]
-
blk.31.attn_qkv.biasF32[15360]
-
blk.31.attn_qkv.weightQ2_K[5120 15360]
-
blk.31.attn_output.weightQ2_K[5120 5120]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ4_0[13696 5120]
-
blk.31.ffn_up.weightQ2_K[5120 13696]
-
blk.31.ffn_gate.weightQ2_K[5120 13696]
-
blk.32.attn_qkv.biasF32[15360]
-
blk.32.attn_qkv.weightQ2_K[5120 15360]
-
blk.32.attn_output.weightQ2_K[5120 5120]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ4_0[13696 5120]
-
blk.32.ffn_up.weightQ2_K[5120 13696]
-
blk.32.ffn_gate.weightQ2_K[5120 13696]
-
blk.33.attn_qkv.biasF32[15360]
-
blk.33.attn_qkv.weightQ2_K[5120 15360]
-
blk.33.attn_output.weightQ2_K[5120 5120]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ4_0[13696 5120]
-
blk.33.ffn_up.weightQ2_K[5120 13696]
-
blk.33.ffn_gate.weightQ2_K[5120 13696]
-
blk.34.attn_qkv.biasF32[15360]
-
blk.34.attn_qkv.weightQ2_K[5120 15360]
-
blk.34.attn_output.weightQ2_K[5120 5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ4_0[13696 5120]
-
blk.34.ffn_up.weightQ2_K[5120 13696]
-
blk.34.ffn_gate.weightQ2_K[5120 13696]
-
blk.35.attn_qkv.biasF32[15360]
-
blk.35.attn_qkv.weightQ2_K[5120 15360]
-
blk.35.attn_output.weightQ2_K[5120 5120]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ4_0[13696 5120]
-
blk.35.ffn_up.weightQ2_K[5120 13696]
-
blk.35.ffn_gate.weightQ2_K[5120 13696]
-
blk.36.attn_qkv.biasF32[15360]
-
blk.36.attn_qkv.weightQ2_K[5120 15360]
-
blk.36.attn_output.weightQ2_K[5120 5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ4_0[13696 5120]
-
blk.36.ffn_up.weightQ2_K[5120 13696]
-
blk.36.ffn_gate.weightQ2_K[5120 13696]
-
blk.37.attn_qkv.biasF32[15360]
-
blk.37.attn_qkv.weightQ2_K[5120 15360]
-
blk.37.attn_output.weightQ2_K[5120 5120]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ4_0[13696 5120]
-
blk.37.ffn_up.weightQ2_K[5120 13696]
-
blk.37.ffn_gate.weightQ2_K[5120 13696]
-
blk.38.attn_qkv.biasF32[15360]
-
blk.38.attn_qkv.weightQ2_K[5120 15360]
-
blk.38.attn_output.weightQ2_K[5120 5120]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ4_0[13696 5120]
-
blk.38.ffn_up.weightQ2_K[5120 13696]
-
blk.38.ffn_gate.weightQ2_K[5120 13696]
-
blk.39.attn_qkv.biasF32[15360]
-
blk.39.attn_qkv.weightQ2_K[5120 15360]
-
blk.39.attn_output.weightQ2_K[5120 5120]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ4_0[13696 5120]
-
blk.39.ffn_up.weightQ2_K[5120 13696]
-
blk.39.ffn_gate.weightQ2_K[5120 13696]
-
output.weightQ6_K[5120 152064]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39