22B
8 Pulls Updated 4 days ago
e94d1c65a4a7 · 44GB
-
general.architecturesolar
-
general.file_typeF16
-
solar.attention.block_skip_connection.00
-
solar.attention.block_skip_connection.10
-
solar.attention.block_skip_connection.20
-
solar.attention.block_skip_connection.30
-
solar.attention.head_count40
-
solar.attention.head_count_kv10
-
solar.attention.layer_norm_rms_epsilon1e-05
-
solar.block_count64
-
solar.context_length4096
-
solar.embedding_length5120
-
solar.feed_forward_length17920
-
solar.rope.dimension_count128
-
solar.rope.freq_base10000
-
solar.vocab_size32128
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id32007
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.padding_token_id32007
-
tokenizer.ggml.predefault
-
tokenizer.ggml.scores[-1000 -1000 -1000 -1000 -1000 ...]
-
tokenizer.ggml.token_type[3 3 1 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <|startoftext|> <|endoftext|> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightF16[5120 32128]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightF16[17920 5120]
-
blk.0.ffn_gate.weightF16[5120 17920]
-
blk.0.ffn_up.weightF16[5120 17920]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.weightF16[5120 1280]
-
blk.0.attn_output.weightF16[5120 5120]
-
blk.0.attn_q.weightF16[5120 5120]
-
blk.0.attn_v.weightF16[5120 1280]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightF16[17920 5120]
-
blk.1.ffn_gate.weightF16[5120 17920]
-
blk.1.ffn_up.weightF16[5120 17920]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.weightF16[5120 1280]
-
blk.1.attn_output.weightF16[5120 5120]
-
blk.1.attn_q.weightF16[5120 5120]
-
blk.1.attn_v.weightF16[5120 1280]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightF16[17920 5120]
-
blk.2.ffn_gate.weightF16[5120 17920]
-
blk.2.ffn_up.weightF16[5120 17920]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.weightF16[5120 1280]
-
blk.2.attn_output.weightF16[5120 5120]
-
blk.2.attn_q.weightF16[5120 5120]
-
blk.2.attn_v.weightF16[5120 1280]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightF16[17920 5120]
-
blk.3.ffn_gate.weightF16[5120 17920]
-
blk.3.ffn_up.weightF16[5120 17920]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.weightF16[5120 1280]
-
blk.3.attn_output.weightF16[5120 5120]
-
blk.3.attn_q.weightF16[5120 5120]
-
blk.3.attn_v.weightF16[5120 1280]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightF16[17920 5120]
-
blk.4.ffn_gate.weightF16[5120 17920]
-
blk.4.ffn_up.weightF16[5120 17920]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.weightF16[5120 1280]
-
blk.4.attn_output.weightF16[5120 5120]
-
blk.4.attn_q.weightF16[5120 5120]
-
blk.4.attn_v.weightF16[5120 1280]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightF16[17920 5120]
-
blk.5.ffn_gate.weightF16[5120 17920]
-
blk.5.ffn_up.weightF16[5120 17920]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.weightF16[5120 1280]
-
blk.5.attn_output.weightF16[5120 5120]
-
blk.5.attn_q.weightF16[5120 5120]
-
blk.5.attn_v.weightF16[5120 1280]
-
blk.6.ffn_gate.weightF16[5120 17920]
-
blk.6.ffn_up.weightF16[5120 17920]
-
blk.6.attn_k.weightF16[5120 1280]
-
blk.6.attn_output.weightF16[5120 5120]
-
blk.6.attn_q.weightF16[5120 5120]
-
blk.6.attn_v.weightF16[5120 1280]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightF16[17920 5120]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightF16[17920 5120]
-
blk.7.ffn_gate.weightF16[5120 17920]
-
blk.7.ffn_up.weightF16[5120 17920]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.weightF16[5120 1280]
-
blk.7.attn_output.weightF16[5120 5120]
-
blk.7.attn_q.weightF16[5120 5120]
-
blk.7.attn_v.weightF16[5120 1280]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightF16[17920 5120]
-
blk.8.ffn_gate.weightF16[5120 17920]
-
blk.8.ffn_up.weightF16[5120 17920]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.weightF16[5120 1280]
-
blk.8.attn_output.weightF16[5120 5120]
-
blk.8.attn_q.weightF16[5120 5120]
-
blk.8.attn_v.weightF16[5120 1280]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightF16[17920 5120]
-
blk.9.ffn_gate.weightF16[5120 17920]
-
blk.9.ffn_up.weightF16[5120 17920]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.weightF16[5120 1280]
-
blk.9.attn_output.weightF16[5120 5120]
-
blk.9.attn_q.weightF16[5120 5120]
-
blk.9.attn_v.weightF16[5120 1280]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightF16[17920 5120]
-
blk.10.ffn_gate.weightF16[5120 17920]
-
blk.10.ffn_up.weightF16[5120 17920]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.weightF16[5120 1280]
-
blk.10.attn_output.weightF16[5120 5120]
-
blk.10.attn_q.weightF16[5120 5120]
-
blk.10.attn_v.weightF16[5120 1280]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightF16[17920 5120]
-
blk.11.ffn_gate.weightF16[5120 17920]
-
blk.11.ffn_up.weightF16[5120 17920]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.weightF16[5120 1280]
-
blk.11.attn_output.weightF16[5120 5120]
-
blk.11.attn_q.weightF16[5120 5120]
-
blk.11.attn_v.weightF16[5120 1280]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightF16[17920 5120]
-
blk.12.ffn_gate.weightF16[5120 17920]
-
blk.12.ffn_up.weightF16[5120 17920]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.weightF16[5120 1280]
-
blk.12.attn_output.weightF16[5120 5120]
-
blk.12.attn_q.weightF16[5120 5120]
-
blk.12.attn_v.weightF16[5120 1280]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightF16[17920 5120]
-
blk.13.ffn_gate.weightF16[5120 17920]
-
blk.13.ffn_up.weightF16[5120 17920]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.weightF16[5120 1280]
-
blk.13.attn_output.weightF16[5120 5120]
-
blk.13.attn_q.weightF16[5120 5120]
-
blk.13.attn_v.weightF16[5120 1280]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightF16[17920 5120]
-
blk.14.ffn_gate.weightF16[5120 17920]
-
blk.14.ffn_up.weightF16[5120 17920]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.weightF16[5120 1280]
-
blk.14.attn_output.weightF16[5120 5120]
-
blk.14.attn_q.weightF16[5120 5120]
-
blk.14.attn_v.weightF16[5120 1280]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightF16[17920 5120]
-
blk.15.ffn_gate.weightF16[5120 17920]
-
blk.15.ffn_up.weightF16[5120 17920]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.15.attn_k.weightF16[5120 1280]
-
blk.15.attn_output.weightF16[5120 5120]
-
blk.15.attn_q.weightF16[5120 5120]
-
blk.15.attn_v.weightF16[5120 1280]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightF16[17920 5120]
-
blk.16.ffn_gate.weightF16[5120 17920]
-
blk.16.ffn_up.weightF16[5120 17920]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.weightF16[5120 1280]
-
blk.16.attn_output.weightF16[5120 5120]
-
blk.16.attn_q.weightF16[5120 5120]
-
blk.16.attn_v.weightF16[5120 1280]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightF16[17920 5120]
-
blk.17.ffn_gate.weightF16[5120 17920]
-
blk.17.ffn_up.weightF16[5120 17920]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.weightF16[5120 1280]
-
blk.17.attn_output.weightF16[5120 5120]
-
blk.17.attn_q.weightF16[5120 5120]
-
blk.17.attn_v.weightF16[5120 1280]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightF16[17920 5120]
-
blk.18.ffn_gate.weightF16[5120 17920]
-
blk.18.ffn_up.weightF16[5120 17920]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.weightF16[5120 1280]
-
blk.18.attn_output.weightF16[5120 5120]
-
blk.18.attn_q.weightF16[5120 5120]
-
blk.18.attn_v.weightF16[5120 1280]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightF16[17920 5120]
-
blk.19.ffn_gate.weightF16[5120 17920]
-
blk.19.ffn_up.weightF16[5120 17920]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.weightF16[5120 1280]
-
blk.19.attn_output.weightF16[5120 5120]
-
blk.19.attn_q.weightF16[5120 5120]
-
blk.19.attn_v.weightF16[5120 1280]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightF16[17920 5120]
-
blk.20.ffn_gate.weightF16[5120 17920]
-
blk.20.ffn_up.weightF16[5120 17920]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.weightF16[5120 1280]
-
blk.20.attn_output.weightF16[5120 5120]
-
blk.20.attn_q.weightF16[5120 5120]
-
blk.20.attn_v.weightF16[5120 1280]
-
blk.21.attn_k.weightF16[5120 1280]
-
blk.21.attn_output.weightF16[5120 5120]
-
blk.21.attn_q.weightF16[5120 5120]
-
blk.21.attn_v.weightF16[5120 1280]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightF16[17920 5120]
-
blk.21.ffn_gate.weightF16[5120 17920]
-
blk.21.ffn_up.weightF16[5120 17920]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightF16[17920 5120]
-
blk.22.ffn_gate.weightF16[5120 17920]
-
blk.22.ffn_up.weightF16[5120 17920]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.weightF16[5120 1280]
-
blk.22.attn_output.weightF16[5120 5120]
-
blk.22.attn_q.weightF16[5120 5120]
-
blk.22.attn_v.weightF16[5120 1280]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightF16[17920 5120]
-
blk.23.ffn_gate.weightF16[5120 17920]
-
blk.23.ffn_up.weightF16[5120 17920]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.weightF16[5120 1280]
-
blk.23.attn_output.weightF16[5120 5120]
-
blk.23.attn_q.weightF16[5120 5120]
-
blk.23.attn_v.weightF16[5120 1280]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightF16[17920 5120]
-
blk.24.ffn_gate.weightF16[5120 17920]
-
blk.24.ffn_up.weightF16[5120 17920]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.24.attn_k.weightF16[5120 1280]
-
blk.24.attn_output.weightF16[5120 5120]
-
blk.24.attn_q.weightF16[5120 5120]
-
blk.24.attn_v.weightF16[5120 1280]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightF16[17920 5120]
-
blk.25.ffn_gate.weightF16[5120 17920]
-
blk.25.ffn_up.weightF16[5120 17920]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.weightF16[5120 1280]
-
blk.25.attn_output.weightF16[5120 5120]
-
blk.25.attn_q.weightF16[5120 5120]
-
blk.25.attn_v.weightF16[5120 1280]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightF16[17920 5120]
-
blk.26.ffn_gate.weightF16[5120 17920]
-
blk.26.ffn_up.weightF16[5120 17920]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.weightF16[5120 1280]
-
blk.26.attn_output.weightF16[5120 5120]
-
blk.26.attn_q.weightF16[5120 5120]
-
blk.26.attn_v.weightF16[5120 1280]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightF16[17920 5120]
-
blk.27.ffn_gate.weightF16[5120 17920]
-
blk.27.ffn_up.weightF16[5120 17920]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.weightF16[5120 1280]
-
blk.27.attn_output.weightF16[5120 5120]
-
blk.27.attn_q.weightF16[5120 5120]
-
blk.27.attn_v.weightF16[5120 1280]
-
blk.28.ffn_gate.weightF16[5120 17920]
-
blk.28.attn_k.weightF16[5120 1280]
-
blk.28.attn_output.weightF16[5120 5120]
-
blk.28.attn_q.weightF16[5120 5120]
-
blk.28.attn_v.weightF16[5120 1280]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightF16[17920 5120]
-
blk.28.ffn_up.weightF16[5120 17920]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightF16[17920 5120]
-
blk.29.ffn_gate.weightF16[5120 17920]
-
blk.29.ffn_up.weightF16[5120 17920]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.weightF16[5120 1280]
-
blk.29.attn_output.weightF16[5120 5120]
-
blk.29.attn_q.weightF16[5120 5120]
-
blk.29.attn_v.weightF16[5120 1280]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightF16[17920 5120]
-
blk.30.ffn_gate.weightF16[5120 17920]
-
blk.30.ffn_up.weightF16[5120 17920]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.weightF16[5120 1280]
-
blk.30.attn_output.weightF16[5120 5120]
-
blk.30.attn_q.weightF16[5120 5120]
-
blk.30.attn_v.weightF16[5120 1280]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightF16[17920 5120]
-
blk.31.ffn_gate.weightF16[5120 17920]
-
blk.31.ffn_up.weightF16[5120 17920]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.weightF16[5120 1280]
-
blk.31.attn_output.weightF16[5120 5120]
-
blk.31.attn_q.weightF16[5120 5120]
-
blk.31.attn_v.weightF16[5120 1280]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightF16[17920 5120]
-
blk.32.ffn_gate.weightF16[5120 17920]
-
blk.32.ffn_up.weightF16[5120 17920]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.weightF16[5120 1280]
-
blk.32.attn_output.weightF16[5120 5120]
-
blk.32.attn_q.weightF16[5120 5120]
-
blk.32.attn_v.weightF16[5120 1280]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightF16[17920 5120]
-
blk.33.ffn_gate.weightF16[5120 17920]
-
blk.33.ffn_up.weightF16[5120 17920]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.33.attn_k.weightF16[5120 1280]
-
blk.33.attn_output.weightF16[5120 5120]
-
blk.33.attn_q.weightF16[5120 5120]
-
blk.33.attn_v.weightF16[5120 1280]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightF16[17920 5120]
-
blk.34.ffn_gate.weightF16[5120 17920]
-
blk.34.ffn_up.weightF16[5120 17920]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.weightF16[5120 1280]
-
blk.34.attn_output.weightF16[5120 5120]
-
blk.34.attn_q.weightF16[5120 5120]
-
blk.34.attn_v.weightF16[5120 1280]
-
blk.35.ffn_gate.weightF16[5120 17920]
-
blk.35.ffn_up.weightF16[5120 17920]
-
blk.35.attn_k.weightF16[5120 1280]
-
blk.35.attn_output.weightF16[5120 5120]
-
blk.35.attn_q.weightF16[5120 5120]
-
blk.35.attn_v.weightF16[5120 1280]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightF16[17920 5120]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightF16[17920 5120]
-
blk.36.ffn_gate.weightF16[5120 17920]
-
blk.36.ffn_up.weightF16[5120 17920]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.weightF16[5120 1280]
-
blk.36.attn_output.weightF16[5120 5120]
-
blk.36.attn_q.weightF16[5120 5120]
-
blk.36.attn_v.weightF16[5120 1280]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightF16[17920 5120]
-
blk.37.ffn_gate.weightF16[5120 17920]
-
blk.37.ffn_up.weightF16[5120 17920]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.weightF16[5120 1280]
-
blk.37.attn_output.weightF16[5120 5120]
-
blk.37.attn_q.weightF16[5120 5120]
-
blk.37.attn_v.weightF16[5120 1280]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightF16[17920 5120]
-
blk.38.ffn_gate.weightF16[5120 17920]
-
blk.38.ffn_up.weightF16[5120 17920]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.weightF16[5120 1280]
-
blk.38.attn_output.weightF16[5120 5120]
-
blk.38.attn_q.weightF16[5120 5120]
-
blk.38.attn_v.weightF16[5120 1280]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightF16[17920 5120]
-
blk.39.ffn_gate.weightF16[5120 17920]
-
blk.39.ffn_up.weightF16[5120 17920]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.weightF16[5120 1280]
-
blk.39.attn_output.weightF16[5120 5120]
-
blk.39.attn_q.weightF16[5120 5120]
-
blk.39.attn_v.weightF16[5120 1280]
-
blk.40.attn_norm.weightF32[5120]
-
blk.40.ffn_down.weightF16[17920 5120]
-
blk.40.ffn_gate.weightF16[5120 17920]
-
blk.40.ffn_up.weightF16[5120 17920]
-
blk.40.ffn_norm.weightF32[5120]
-
blk.40.attn_k.weightF16[5120 1280]
-
blk.40.attn_output.weightF16[5120 5120]
-
blk.40.attn_q.weightF16[5120 5120]
-
blk.40.attn_v.weightF16[5120 1280]
-
blk.41.attn_norm.weightF32[5120]
-
blk.41.ffn_down.weightF16[17920 5120]
-
blk.41.ffn_gate.weightF16[5120 17920]
-
blk.41.ffn_up.weightF16[5120 17920]
-
blk.41.ffn_norm.weightF32[5120]
-
blk.41.attn_k.weightF16[5120 1280]
-
blk.41.attn_output.weightF16[5120 5120]
-
blk.41.attn_q.weightF16[5120 5120]
-
blk.41.attn_v.weightF16[5120 1280]
-
blk.42.attn_norm.weightF32[5120]
-
blk.42.ffn_down.weightF16[17920 5120]
-
blk.42.ffn_gate.weightF16[5120 17920]
-
blk.42.ffn_up.weightF16[5120 17920]
-
blk.42.ffn_norm.weightF32[5120]
-
blk.42.attn_k.weightF16[5120 1280]
-
blk.42.attn_output.weightF16[5120 5120]
-
blk.42.attn_q.weightF16[5120 5120]
-
blk.42.attn_v.weightF16[5120 1280]
-
blk.43.attn_norm.weightF32[5120]
-
blk.43.ffn_down.weightF16[17920 5120]
-
blk.43.ffn_gate.weightF16[5120 17920]
-
blk.43.ffn_up.weightF16[5120 17920]
-
blk.43.ffn_norm.weightF32[5120]
-
blk.43.attn_k.weightF16[5120 1280]
-
blk.43.attn_output.weightF16[5120 5120]
-
blk.43.attn_q.weightF16[5120 5120]
-
blk.43.attn_v.weightF16[5120 1280]
-
blk.44.attn_norm.weightF32[5120]
-
blk.44.ffn_down.weightF16[17920 5120]
-
blk.44.ffn_gate.weightF16[5120 17920]
-
blk.44.ffn_up.weightF16[5120 17920]
-
blk.44.ffn_norm.weightF32[5120]
-
blk.44.attn_k.weightF16[5120 1280]
-
blk.44.attn_output.weightF16[5120 5120]
-
blk.44.attn_q.weightF16[5120 5120]
-
blk.44.attn_v.weightF16[5120 1280]
-
blk.45.attn_norm.weightF32[5120]
-
blk.45.ffn_down.weightF16[17920 5120]
-
blk.45.ffn_gate.weightF16[5120 17920]
-
blk.45.ffn_up.weightF16[5120 17920]
-
blk.45.ffn_norm.weightF32[5120]
-
blk.45.attn_k.weightF16[5120 1280]
-
blk.45.attn_output.weightF16[5120 5120]
-
blk.45.attn_q.weightF16[5120 5120]
-
blk.45.attn_v.weightF16[5120 1280]
-
blk.46.attn_norm.weightF32[5120]
-
blk.46.ffn_down.weightF16[17920 5120]
-
blk.46.ffn_gate.weightF16[5120 17920]
-
blk.46.ffn_up.weightF16[5120 17920]
-
blk.46.ffn_norm.weightF32[5120]
-
blk.46.attn_k.weightF16[5120 1280]
-
blk.46.attn_output.weightF16[5120 5120]
-
blk.46.attn_q.weightF16[5120 5120]
-
blk.46.attn_v.weightF16[5120 1280]
-
blk.47.attn_norm.weightF32[5120]
-
blk.47.ffn_down.weightF16[17920 5120]
-
blk.47.ffn_gate.weightF16[5120 17920]
-
blk.47.ffn_up.weightF16[5120 17920]
-
blk.47.ffn_norm.weightF32[5120]
-
blk.47.attn_k.weightF16[5120 1280]
-
blk.47.attn_output.weightF16[5120 5120]
-
blk.47.attn_q.weightF16[5120 5120]
-
blk.47.attn_v.weightF16[5120 1280]
-
blk.48.attn_norm.weightF32[5120]
-
blk.48.ffn_down.weightF16[17920 5120]
-
blk.48.ffn_gate.weightF16[5120 17920]
-
blk.48.ffn_up.weightF16[5120 17920]
-
blk.48.ffn_norm.weightF32[5120]
-
blk.48.attn_k.weightF16[5120 1280]
-
blk.48.attn_output.weightF16[5120 5120]
-
blk.48.attn_q.weightF16[5120 5120]
-
blk.48.attn_v.weightF16[5120 1280]
-
blk.49.attn_norm.weightF32[5120]
-
blk.49.ffn_down.weightF16[17920 5120]
-
blk.49.ffn_gate.weightF16[5120 17920]
-
blk.49.ffn_up.weightF16[5120 17920]
-
blk.49.ffn_norm.weightF32[5120]
-
blk.49.attn_k.weightF16[5120 1280]
-
blk.49.attn_output.weightF16[5120 5120]
-
blk.49.attn_q.weightF16[5120 5120]
-
blk.49.attn_v.weightF16[5120 1280]
-
blk.50.attn_k.weightF16[5120 1280]
-
blk.50.attn_output.weightF16[5120 5120]
-
blk.50.attn_q.weightF16[5120 5120]
-
blk.50.attn_v.weightF16[5120 1280]
-
blk.50.attn_norm.weightF32[5120]
-
blk.50.ffn_down.weightF16[17920 5120]
-
blk.50.ffn_gate.weightF16[5120 17920]
-
blk.50.ffn_up.weightF16[5120 17920]
-
blk.50.ffn_norm.weightF32[5120]
-
blk.51.attn_norm.weightF32[5120]
-
blk.51.ffn_down.weightF16[17920 5120]
-
blk.51.ffn_gate.weightF16[5120 17920]
-
blk.51.ffn_up.weightF16[5120 17920]
-
blk.51.ffn_norm.weightF32[5120]
-
blk.51.attn_k.weightF16[5120 1280]
-
blk.51.attn_output.weightF16[5120 5120]
-
blk.51.attn_q.weightF16[5120 5120]
-
blk.51.attn_v.weightF16[5120 1280]
-
blk.52.attn_norm.weightF32[5120]
-
blk.52.ffn_down.weightF16[17920 5120]
-
blk.52.ffn_gate.weightF16[5120 17920]
-
blk.52.ffn_up.weightF16[5120 17920]
-
blk.52.ffn_norm.weightF32[5120]
-
blk.52.attn_k.weightF16[5120 1280]
-
blk.52.attn_output.weightF16[5120 5120]
-
blk.52.attn_q.weightF16[5120 5120]
-
blk.52.attn_v.weightF16[5120 1280]
-
blk.53.attn_norm.weightF32[5120]
-
blk.53.ffn_down.weightF16[17920 5120]
-
blk.53.ffn_gate.weightF16[5120 17920]
-
blk.53.ffn_up.weightF16[5120 17920]
-
blk.53.ffn_norm.weightF32[5120]
-
blk.53.attn_k.weightF16[5120 1280]
-
blk.53.attn_output.weightF16[5120 5120]
-
blk.53.attn_q.weightF16[5120 5120]
-
blk.53.attn_v.weightF16[5120 1280]
-
blk.54.attn_norm.weightF32[5120]
-
blk.54.ffn_down.weightF16[17920 5120]
-
blk.54.ffn_gate.weightF16[5120 17920]
-
blk.54.ffn_up.weightF16[5120 17920]
-
blk.54.ffn_norm.weightF32[5120]
-
blk.54.attn_k.weightF16[5120 1280]
-
blk.54.attn_output.weightF16[5120 5120]
-
blk.54.attn_q.weightF16[5120 5120]
-
blk.54.attn_v.weightF16[5120 1280]
-
blk.55.attn_norm.weightF32[5120]
-
blk.55.ffn_down.weightF16[17920 5120]
-
blk.55.ffn_gate.weightF16[5120 17920]
-
blk.55.ffn_up.weightF16[5120 17920]
-
blk.55.ffn_norm.weightF32[5120]
-
blk.55.attn_k.weightF16[5120 1280]
-
blk.55.attn_output.weightF16[5120 5120]
-
blk.55.attn_q.weightF16[5120 5120]
-
blk.55.attn_v.weightF16[5120 1280]
-
blk.56.attn_norm.weightF32[5120]
-
blk.56.ffn_down.weightF16[17920 5120]
-
blk.56.ffn_gate.weightF16[5120 17920]
-
blk.56.ffn_up.weightF16[5120 17920]
-
blk.56.ffn_norm.weightF32[5120]
-
blk.56.attn_k.weightF16[5120 1280]
-
blk.56.attn_output.weightF16[5120 5120]
-
blk.56.attn_q.weightF16[5120 5120]
-
blk.56.attn_v.weightF16[5120 1280]
-
blk.57.ffn_gate.weightF16[5120 17920]
-
blk.57.attn_k.weightF16[5120 1280]
-
blk.57.attn_output.weightF16[5120 5120]
-
blk.57.attn_q.weightF16[5120 5120]
-
blk.57.attn_v.weightF16[5120 1280]
-
blk.57.attn_norm.weightF32[5120]
-
blk.57.ffn_down.weightF16[17920 5120]
-
blk.57.ffn_up.weightF16[5120 17920]
-
blk.57.ffn_norm.weightF32[5120]
-
blk.58.attn_norm.weightF32[5120]
-
blk.58.ffn_down.weightF16[17920 5120]
-
blk.58.ffn_gate.weightF16[5120 17920]
-
blk.58.ffn_up.weightF16[5120 17920]
-
blk.58.ffn_norm.weightF32[5120]
-
blk.58.attn_k.weightF16[5120 1280]
-
blk.58.attn_output.weightF16[5120 5120]
-
blk.58.attn_q.weightF16[5120 5120]
-
blk.58.attn_v.weightF16[5120 1280]
-
blk.59.attn_norm.weightF32[5120]
-
blk.59.ffn_down.weightF16[17920 5120]
-
blk.59.ffn_gate.weightF16[5120 17920]
-
blk.59.ffn_up.weightF16[5120 17920]
-
blk.59.ffn_norm.weightF32[5120]
-
blk.59.attn_k.weightF16[5120 1280]
-
blk.59.attn_output.weightF16[5120 5120]
-
blk.59.attn_q.weightF16[5120 5120]
-
blk.59.attn_v.weightF16[5120 1280]
-
blk.60.attn_norm.weightF32[5120]
-
blk.60.ffn_down.weightF16[17920 5120]
-
blk.60.ffn_gate.weightF16[5120 17920]
-
blk.60.ffn_up.weightF16[5120 17920]
-
blk.60.ffn_norm.weightF32[5120]
-
blk.60.attn_k.weightF16[5120 1280]
-
blk.60.attn_output.weightF16[5120 5120]
-
blk.60.attn_q.weightF16[5120 5120]
-
blk.60.attn_v.weightF16[5120 1280]
-
blk.61.attn_norm.weightF32[5120]
-
blk.61.ffn_down.weightF16[17920 5120]
-
blk.61.ffn_gate.weightF16[5120 17920]
-
blk.61.ffn_up.weightF16[5120 17920]
-
blk.61.ffn_norm.weightF32[5120]
-
blk.61.attn_k.weightF16[5120 1280]
-
blk.61.attn_output.weightF16[5120 5120]
-
blk.61.attn_q.weightF16[5120 5120]
-
blk.61.attn_v.weightF16[5120 1280]
-
blk.62.attn_norm.weightF32[5120]
-
blk.62.ffn_down.weightF16[17920 5120]
-
blk.62.ffn_gate.weightF16[5120 17920]
-
blk.62.ffn_up.weightF16[5120 17920]
-
blk.62.ffn_norm.weightF32[5120]
-
blk.62.attn_k.weightF16[5120 1280]
-
blk.62.attn_output.weightF16[5120 5120]
-
blk.62.attn_q.weightF16[5120 5120]
-
blk.62.attn_v.weightF16[5120 1280]
-
blk.63.attn_norm.weightF32[5120]
-
blk.63.ffn_down.weightF16[17920 5120]
-
blk.63.ffn_gate.weightF16[5120 17920]
-
blk.63.ffn_up.weightF16[5120 17920]
-
blk.63.ffn_norm.weightF32[5120]
-
blk.63.attn_k.weightF16[5120 1280]
-
blk.63.attn_output.weightF16[5120 5120]
-
blk.63.attn_q.weightF16[5120 5120]
-
blk.63.attn_v.weightF16[5120 1280]
-
output.weightF16[5120 32128]
-
output_norm.weightF32[5120]
-
bskcn_tv.weightF32[2]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55
blk.56
blk.57
blk.58
blk.59
blk.60
blk.61
blk.62
blk.63