Original version of WizardLM 2, released April 15th
8x22B
126 Pulls Updated 5 months ago
8acfb2ac416b · 281GB
-
general.architecturellama
-
general.file_typeF16
-
llama.attention.head_count48
-
llama.attention.head_count_kv8
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count56
-
llama.context_length65536
-
llama.embedding_length6144
-
llama.expert_count8
-
llama.expert_used_count2
-
llama.feed_forward_length16384
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
NameTypeShape
-
token_embd.weightF16[6144 32000]
-
blk.0.ffn_gate.0.weightF16[6144 16384]
-
blk.0.ffn_down.0.weightF16[16384 6144]
-
blk.0.ffn_up.0.weightF16[6144 16384]
-
blk.0.ffn_gate.1.weightF16[6144 16384]
-
blk.0.ffn_down.1.weightF16[16384 6144]
-
blk.0.ffn_up.1.weightF16[6144 16384]
-
blk.0.ffn_gate.2.weightF16[6144 16384]
-
blk.0.ffn_down.2.weightF16[16384 6144]
-
blk.0.ffn_up.2.weightF16[6144 16384]
-
blk.0.ffn_gate.3.weightF16[6144 16384]
-
blk.0.ffn_down.3.weightF16[16384 6144]
-
blk.0.ffn_up.3.weightF16[6144 16384]
-
blk.0.ffn_gate.4.weightF16[6144 16384]
-
blk.0.ffn_down.4.weightF16[16384 6144]
-
blk.0.ffn_up.4.weightF16[6144 16384]
-
blk.0.ffn_gate.5.weightF16[6144 16384]
-
blk.0.ffn_down.5.weightF16[16384 6144]
-
blk.0.ffn_up.5.weightF16[6144 16384]
-
blk.0.ffn_gate.6.weightF16[6144 16384]
-
blk.0.ffn_down.6.weightF16[16384 6144]
-
blk.0.ffn_up.6.weightF16[6144 16384]
-
blk.0.ffn_gate.7.weightF16[6144 16384]
-
blk.0.ffn_gate_inp.weightF16[6144 8]
-
blk.0.attn_k.weightF16[6144 1024]
-
blk.0.attn_output.weightF16[6144 6144]
-
blk.0.attn_q.weightF16[6144 6144]
-
blk.0.attn_v.weightF16[6144 1024]
-
blk.0.ffn_down.7.weightF16[16384 6144]
-
blk.0.ffn_up.7.weightF16[6144 16384]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.1.ffn_gate.0.weightF16[6144 16384]
-
blk.1.ffn_down.0.weightF16[16384 6144]
-
blk.1.ffn_up.0.weightF16[6144 16384]
-
blk.1.ffn_gate.1.weightF16[6144 16384]
-
blk.1.ffn_down.1.weightF16[16384 6144]
-
blk.1.ffn_up.1.weightF16[6144 16384]
-
blk.1.ffn_gate.2.weightF16[6144 16384]
-
blk.1.ffn_down.2.weightF16[16384 6144]
-
blk.1.ffn_up.2.weightF16[6144 16384]
-
blk.1.ffn_gate.3.weightF16[6144 16384]
-
blk.1.ffn_down.3.weightF16[16384 6144]
-
blk.1.ffn_up.3.weightF16[6144 16384]
-
blk.1.ffn_gate.4.weightF16[6144 16384]
-
blk.1.ffn_down.4.weightF16[16384 6144]
-
blk.1.ffn_up.4.weightF16[6144 16384]
-
blk.1.ffn_gate.5.weightF16[6144 16384]
-
blk.1.ffn_down.5.weightF16[16384 6144]
-
blk.1.ffn_up.5.weightF16[6144 16384]
-
blk.1.ffn_gate.6.weightF16[6144 16384]
-
blk.1.ffn_down.6.weightF16[16384 6144]
-
blk.1.ffn_up.6.weightF16[6144 16384]
-
blk.1.ffn_gate_inp.weightF16[6144 8]
-
blk.1.attn_k.weightF16[6144 1024]
-
blk.1.attn_output.weightF16[6144 6144]
-
blk.1.attn_q.weightF16[6144 6144]
-
blk.1.attn_v.weightF16[6144 1024]
-
blk.1.ffn_gate.7.weightF16[6144 16384]
-
blk.1.ffn_down.7.weightF16[16384 6144]
-
blk.1.ffn_up.7.weightF16[6144 16384]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.2.ffn_gate.0.weightF16[6144 16384]
-
blk.2.ffn_down.0.weightF16[16384 6144]
-
blk.2.ffn_up.0.weightF16[6144 16384]
-
blk.2.ffn_gate.1.weightF16[6144 16384]
-
blk.2.ffn_down.1.weightF16[16384 6144]
-
blk.2.ffn_up.1.weightF16[6144 16384]
-
blk.2.ffn_gate.2.weightF16[6144 16384]
-
blk.2.ffn_down.2.weightF16[16384 6144]
-
blk.2.ffn_up.2.weightF16[6144 16384]
-
blk.2.ffn_gate.3.weightF16[6144 16384]
-
blk.2.ffn_down.3.weightF16[16384 6144]
-
blk.2.ffn_up.3.weightF16[6144 16384]
-
blk.2.ffn_gate.4.weightF16[6144 16384]
-
blk.2.ffn_down.4.weightF16[16384 6144]
-
blk.2.ffn_up.4.weightF16[6144 16384]
-
blk.2.ffn_gate.5.weightF16[6144 16384]
-
blk.2.ffn_down.5.weightF16[16384 6144]
-
blk.2.ffn_up.5.weightF16[6144 16384]
-
blk.2.ffn_gate.6.weightF16[6144 16384]
-
blk.2.ffn_down.6.weightF16[16384 6144]
-
blk.2.ffn_gate_inp.weightF16[6144 8]
-
blk.2.attn_k.weightF16[6144 1024]
-
blk.2.attn_output.weightF16[6144 6144]
-
blk.2.attn_q.weightF16[6144 6144]
-
blk.2.attn_v.weightF16[6144 1024]
-
blk.2.ffn_up.6.weightF16[6144 16384]
-
blk.2.ffn_gate.7.weightF16[6144 16384]
-
blk.2.ffn_down.7.weightF16[16384 6144]
-
blk.2.ffn_up.7.weightF16[6144 16384]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.3.ffn_gate.0.weightF16[6144 16384]
-
blk.3.ffn_down.0.weightF16[16384 6144]
-
blk.3.ffn_up.0.weightF16[6144 16384]
-
blk.3.ffn_gate.1.weightF16[6144 16384]
-
blk.3.ffn_down.1.weightF16[16384 6144]
-
blk.3.ffn_up.1.weightF16[6144 16384]
-
blk.3.ffn_gate.2.weightF16[6144 16384]
-
blk.3.ffn_down.2.weightF16[16384 6144]
-
blk.3.ffn_up.2.weightF16[6144 16384]
-
blk.3.ffn_gate.3.weightF16[6144 16384]
-
blk.3.ffn_down.3.weightF16[16384 6144]
-
blk.3.ffn_up.3.weightF16[6144 16384]
-
blk.3.ffn_gate.4.weightF16[6144 16384]
-
blk.3.ffn_down.4.weightF16[16384 6144]
-
blk.3.ffn_up.4.weightF16[6144 16384]
-
blk.3.ffn_gate.5.weightF16[6144 16384]
-
blk.3.ffn_down.5.weightF16[16384 6144]
-
blk.3.ffn_up.5.weightF16[6144 16384]
-
blk.3.ffn_gate.6.weightF16[6144 16384]
-
blk.3.ffn_gate_inp.weightF16[6144 8]
-
blk.3.attn_k.weightF16[6144 1024]
-
blk.3.attn_output.weightF16[6144 6144]
-
blk.3.attn_q.weightF16[6144 6144]
-
blk.3.attn_v.weightF16[6144 1024]
-
blk.3.ffn_down.6.weightF16[16384 6144]
-
blk.3.ffn_up.6.weightF16[6144 16384]
-
blk.3.ffn_gate.7.weightF16[6144 16384]
-
blk.3.ffn_down.7.weightF16[16384 6144]
-
blk.3.ffn_up.7.weightF16[6144 16384]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.4.ffn_gate.0.weightF16[6144 16384]
-
blk.4.ffn_down.0.weightF16[16384 6144]
-
blk.4.ffn_up.0.weightF16[6144 16384]
-
blk.4.ffn_gate.1.weightF16[6144 16384]
-
blk.4.ffn_down.1.weightF16[16384 6144]
-
blk.4.ffn_up.1.weightF16[6144 16384]
-
blk.4.ffn_gate.2.weightF16[6144 16384]
-
blk.4.ffn_down.2.weightF16[16384 6144]
-
blk.4.ffn_up.2.weightF16[6144 16384]
-
blk.4.ffn_gate.3.weightF16[6144 16384]
-
blk.4.ffn_down.3.weightF16[16384 6144]
-
blk.4.ffn_up.3.weightF16[6144 16384]
-
blk.4.ffn_gate.4.weightF16[6144 16384]
-
blk.4.ffn_down.4.weightF16[16384 6144]
-
blk.4.ffn_up.4.weightF16[6144 16384]
-
blk.4.ffn_gate.5.weightF16[6144 16384]
-
blk.4.ffn_down.5.weightF16[16384 6144]
-
blk.4.ffn_up.5.weightF16[6144 16384]
-
blk.4.ffn_gate_inp.weightF16[6144 8]
-
blk.4.attn_k.weightF16[6144 1024]
-
blk.4.attn_output.weightF16[6144 6144]
-
blk.4.attn_q.weightF16[6144 6144]
-
blk.4.attn_v.weightF16[6144 1024]
-
blk.4.ffn_gate.6.weightF16[6144 16384]
-
blk.4.ffn_down.6.weightF16[16384 6144]
-
blk.4.ffn_up.6.weightF16[6144 16384]
-
blk.4.ffn_gate.7.weightF16[6144 16384]
-
blk.4.ffn_down.7.weightF16[16384 6144]
-
blk.4.ffn_up.7.weightF16[6144 16384]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.5.ffn_gate.0.weightF16[6144 16384]
-
blk.5.ffn_down.0.weightF16[16384 6144]
-
blk.5.ffn_up.0.weightF16[6144 16384]
-
blk.5.ffn_gate.1.weightF16[6144 16384]
-
blk.5.ffn_down.1.weightF16[16384 6144]
-
blk.5.ffn_up.1.weightF16[6144 16384]
-
blk.5.ffn_gate.2.weightF16[6144 16384]
-
blk.5.ffn_down.2.weightF16[16384 6144]
-
blk.5.ffn_up.2.weightF16[6144 16384]
-
blk.5.ffn_gate.3.weightF16[6144 16384]
-
blk.5.ffn_down.3.weightF16[16384 6144]
-
blk.5.ffn_up.3.weightF16[6144 16384]
-
blk.5.ffn_gate.4.weightF16[6144 16384]
-
blk.5.ffn_down.4.weightF16[16384 6144]
-
blk.5.ffn_up.4.weightF16[6144 16384]
-
blk.5.ffn_gate.5.weightF16[6144 16384]
-
blk.5.ffn_down.5.weightF16[16384 6144]
-
blk.5.ffn_gate_inp.weightF16[6144 8]
-
blk.5.attn_k.weightF16[6144 1024]
-
blk.5.attn_output.weightF16[6144 6144]
-
blk.5.attn_q.weightF16[6144 6144]
-
blk.5.attn_v.weightF16[6144 1024]
-
blk.5.ffn_up.5.weightF16[6144 16384]
-
blk.5.ffn_gate.6.weightF16[6144 16384]
-
blk.5.ffn_down.6.weightF16[16384 6144]
-
blk.5.ffn_up.6.weightF16[6144 16384]
-
blk.5.ffn_gate.7.weightF16[6144 16384]
-
blk.5.ffn_down.7.weightF16[16384 6144]
-
blk.5.ffn_up.7.weightF16[6144 16384]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.6.ffn_gate.0.weightF16[6144 16384]
-
blk.6.ffn_down.0.weightF16[16384 6144]
-
blk.6.ffn_up.0.weightF16[6144 16384]
-
blk.6.ffn_gate.1.weightF16[6144 16384]
-
blk.6.ffn_down.1.weightF16[16384 6144]
-
blk.6.ffn_up.1.weightF16[6144 16384]
-
blk.6.ffn_gate.2.weightF16[6144 16384]
-
blk.6.ffn_down.2.weightF16[16384 6144]
-
blk.6.ffn_up.2.weightF16[6144 16384]
-
blk.6.ffn_gate.3.weightF16[6144 16384]
-
blk.6.ffn_down.3.weightF16[16384 6144]
-
blk.6.ffn_up.3.weightF16[6144 16384]
-
blk.6.ffn_gate.4.weightF16[6144 16384]
-
blk.6.ffn_down.4.weightF16[16384 6144]
-
blk.6.ffn_up.4.weightF16[6144 16384]
-
blk.6.ffn_gate.5.weightF16[6144 16384]
-
blk.6.ffn_gate_inp.weightF16[6144 8]
-
blk.6.attn_k.weightF16[6144 1024]
-
blk.6.attn_output.weightF16[6144 6144]
-
blk.6.attn_q.weightF16[6144 6144]
-
blk.6.attn_v.weightF16[6144 1024]
-
blk.6.ffn_down.5.weightF16[16384 6144]
-
blk.6.ffn_up.5.weightF16[6144 16384]
-
blk.6.ffn_gate.6.weightF16[6144 16384]
-
blk.6.ffn_down.6.weightF16[16384 6144]
-
blk.6.ffn_up.6.weightF16[6144 16384]
-
blk.6.ffn_gate.7.weightF16[6144 16384]
-
blk.6.ffn_down.7.weightF16[16384 6144]
-
blk.6.ffn_up.7.weightF16[6144 16384]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.7.ffn_gate.0.weightF16[6144 16384]
-
blk.7.ffn_down.0.weightF16[16384 6144]
-
blk.7.ffn_up.0.weightF16[6144 16384]
-
blk.7.ffn_gate.1.weightF16[6144 16384]
-
blk.7.ffn_down.1.weightF16[16384 6144]
-
blk.7.ffn_up.1.weightF16[6144 16384]
-
blk.7.ffn_gate.2.weightF16[6144 16384]
-
blk.7.ffn_down.2.weightF16[16384 6144]
-
blk.7.ffn_up.2.weightF16[6144 16384]
-
blk.7.ffn_gate.3.weightF16[6144 16384]
-
blk.7.ffn_down.3.weightF16[16384 6144]
-
blk.7.ffn_up.3.weightF16[6144 16384]
-
blk.7.ffn_gate.4.weightF16[6144 16384]
-
blk.7.ffn_down.4.weightF16[16384 6144]
-
blk.7.ffn_up.4.weightF16[6144 16384]
-
blk.7.ffn_gate_inp.weightF16[6144 8]
-
blk.7.attn_k.weightF16[6144 1024]
-
blk.7.attn_output.weightF16[6144 6144]
-
blk.7.attn_q.weightF16[6144 6144]
-
blk.7.attn_v.weightF16[6144 1024]
-
blk.7.ffn_gate.5.weightF16[6144 16384]
-
blk.7.ffn_down.5.weightF16[16384 6144]
-
blk.7.ffn_up.5.weightF16[6144 16384]
-
blk.7.ffn_gate.6.weightF16[6144 16384]
-
blk.7.ffn_down.6.weightF16[16384 6144]
-
blk.7.ffn_up.6.weightF16[6144 16384]
-
blk.7.ffn_gate.7.weightF16[6144 16384]
-
blk.7.ffn_down.7.weightF16[16384 6144]
-
blk.7.ffn_up.7.weightF16[6144 16384]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.8.ffn_gate.0.weightF16[6144 16384]
-
blk.8.ffn_down.0.weightF16[16384 6144]
-
blk.8.ffn_up.0.weightF16[6144 16384]
-
blk.8.ffn_gate.1.weightF16[6144 16384]
-
blk.8.ffn_down.1.weightF16[16384 6144]
-
blk.8.ffn_up.1.weightF16[6144 16384]
-
blk.8.ffn_gate.2.weightF16[6144 16384]
-
blk.8.ffn_down.2.weightF16[16384 6144]
-
blk.8.ffn_up.2.weightF16[6144 16384]
-
blk.8.ffn_gate.3.weightF16[6144 16384]
-
blk.8.ffn_down.3.weightF16[16384 6144]
-
blk.8.ffn_up.3.weightF16[6144 16384]
-
blk.8.ffn_gate.4.weightF16[6144 16384]
-
blk.8.ffn_down.4.weightF16[16384 6144]
-
blk.8.ffn_gate_inp.weightF16[6144 8]
-
blk.8.attn_k.weightF16[6144 1024]
-
blk.8.attn_output.weightF16[6144 6144]
-
blk.8.attn_q.weightF16[6144 6144]
-
blk.8.attn_v.weightF16[6144 1024]
-
blk.8.ffn_up.4.weightF16[6144 16384]
-
blk.8.ffn_gate.5.weightF16[6144 16384]
-
blk.8.ffn_down.5.weightF16[16384 6144]
-
blk.8.ffn_up.5.weightF16[6144 16384]
-
blk.8.ffn_gate.6.weightF16[6144 16384]
-
blk.8.ffn_down.6.weightF16[16384 6144]
-
blk.8.ffn_up.6.weightF16[6144 16384]
-
blk.8.ffn_gate.7.weightF16[6144 16384]
-
blk.8.ffn_down.7.weightF16[16384 6144]
-
blk.8.ffn_up.7.weightF16[6144 16384]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.9.ffn_gate.0.weightF16[6144 16384]
-
blk.9.ffn_down.0.weightF16[16384 6144]
-
blk.9.ffn_up.0.weightF16[6144 16384]
-
blk.9.ffn_gate.1.weightF16[6144 16384]
-
blk.9.ffn_down.1.weightF16[16384 6144]
-
blk.9.ffn_up.1.weightF16[6144 16384]
-
blk.9.ffn_gate.2.weightF16[6144 16384]
-
blk.9.ffn_down.2.weightF16[16384 6144]
-
blk.9.ffn_up.2.weightF16[6144 16384]
-
blk.9.ffn_gate.3.weightF16[6144 16384]
-
blk.9.ffn_down.3.weightF16[16384 6144]
-
blk.9.ffn_up.3.weightF16[6144 16384]
-
blk.9.ffn_gate.4.weightF16[6144 16384]
-
blk.9.ffn_gate_inp.weightF16[6144 8]
-
blk.9.attn_k.weightF16[6144 1024]
-
blk.9.attn_output.weightF16[6144 6144]
-
blk.9.attn_q.weightF16[6144 6144]
-
blk.9.attn_v.weightF16[6144 1024]
-
blk.9.ffn_down.4.weightF16[16384 6144]
-
blk.9.ffn_up.4.weightF16[6144 16384]
-
blk.9.ffn_gate.5.weightF16[6144 16384]
-
blk.9.ffn_down.5.weightF16[16384 6144]
-
blk.9.ffn_up.5.weightF16[6144 16384]
-
blk.9.ffn_gate.6.weightF16[6144 16384]
-
blk.9.ffn_down.6.weightF16[16384 6144]
-
blk.9.ffn_up.6.weightF16[6144 16384]
-
blk.9.ffn_gate.7.weightF16[6144 16384]
-
blk.9.ffn_down.7.weightF16[16384 6144]
-
blk.9.ffn_up.7.weightF16[6144 16384]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.10.ffn_gate.0.weightF16[6144 16384]
-
blk.10.ffn_down.0.weightF16[16384 6144]
-
blk.10.ffn_up.0.weightF16[6144 16384]
-
blk.10.ffn_gate.1.weightF16[6144 16384]
-
blk.10.ffn_down.1.weightF16[16384 6144]
-
blk.10.ffn_up.1.weightF16[6144 16384]
-
blk.10.ffn_gate.2.weightF16[6144 16384]
-
blk.10.ffn_down.2.weightF16[16384 6144]
-
blk.10.ffn_up.2.weightF16[6144 16384]
-
blk.10.ffn_gate.3.weightF16[6144 16384]
-
blk.10.ffn_down.3.weightF16[16384 6144]
-
blk.10.ffn_up.3.weightF16[6144 16384]
-
blk.10.ffn_gate_inp.weightF16[6144 8]
-
blk.10.attn_k.weightF16[6144 1024]
-
blk.10.attn_output.weightF16[6144 6144]
-
blk.10.attn_q.weightF16[6144 6144]
-
blk.10.attn_v.weightF16[6144 1024]
-
blk.10.ffn_gate.4.weightF16[6144 16384]
-
blk.10.ffn_down.4.weightF16[16384 6144]
-
blk.10.ffn_up.4.weightF16[6144 16384]
-
blk.10.ffn_gate.5.weightF16[6144 16384]
-
blk.10.ffn_down.5.weightF16[16384 6144]
-
blk.10.ffn_up.5.weightF16[6144 16384]
-
blk.10.ffn_gate.6.weightF16[6144 16384]
-
blk.10.ffn_down.6.weightF16[16384 6144]
-
blk.10.ffn_up.6.weightF16[6144 16384]
-
blk.10.ffn_gate.7.weightF16[6144 16384]
-
blk.10.ffn_down.7.weightF16[16384 6144]
-
blk.10.ffn_up.7.weightF16[6144 16384]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.11.ffn_gate.0.weightF16[6144 16384]
-
blk.11.ffn_down.0.weightF16[16384 6144]
-
blk.11.ffn_up.0.weightF16[6144 16384]
-
blk.11.ffn_gate.1.weightF16[6144 16384]
-
blk.11.ffn_down.1.weightF16[16384 6144]
-
blk.11.ffn_up.1.weightF16[6144 16384]
-
blk.11.ffn_gate.2.weightF16[6144 16384]
-
blk.11.ffn_down.2.weightF16[16384 6144]
-
blk.11.ffn_up.2.weightF16[6144 16384]
-
blk.11.ffn_gate.3.weightF16[6144 16384]
-
blk.11.ffn_down.3.weightF16[16384 6144]
-
blk.11.ffn_gate_inp.weightF16[6144 8]
-
blk.11.attn_k.weightF16[6144 1024]
-
blk.11.attn_output.weightF16[6144 6144]
-
blk.11.attn_q.weightF16[6144 6144]
-
blk.11.attn_v.weightF16[6144 1024]
-
blk.11.ffn_up.3.weightF16[6144 16384]
-
blk.11.ffn_gate.4.weightF16[6144 16384]
-
blk.11.ffn_down.4.weightF16[16384 6144]
-
blk.11.ffn_up.4.weightF16[6144 16384]
-
blk.11.ffn_gate.5.weightF16[6144 16384]
-
blk.11.ffn_down.5.weightF16[16384 6144]
-
blk.11.ffn_up.5.weightF16[6144 16384]
-
blk.11.ffn_gate.6.weightF16[6144 16384]
-
blk.11.ffn_down.6.weightF16[16384 6144]
-
blk.11.ffn_up.6.weightF16[6144 16384]
-
blk.11.ffn_gate.7.weightF16[6144 16384]
-
blk.11.ffn_down.7.weightF16[16384 6144]
-
blk.11.ffn_up.7.weightF16[6144 16384]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.12.ffn_gate.0.weightF16[6144 16384]
-
blk.12.ffn_down.0.weightF16[16384 6144]
-
blk.12.ffn_up.0.weightF16[6144 16384]
-
blk.12.ffn_gate.1.weightF16[6144 16384]
-
blk.12.ffn_down.1.weightF16[16384 6144]
-
blk.12.ffn_up.1.weightF16[6144 16384]
-
blk.12.ffn_gate.2.weightF16[6144 16384]
-
blk.12.ffn_down.2.weightF16[16384 6144]
-
blk.12.ffn_up.2.weightF16[6144 16384]
-
blk.12.ffn_gate.3.weightF16[6144 16384]
-
blk.12.ffn_gate_inp.weightF16[6144 8]
-
blk.12.attn_k.weightF16[6144 1024]
-
blk.12.attn_output.weightF16[6144 6144]
-
blk.12.attn_q.weightF16[6144 6144]
-
blk.12.attn_v.weightF16[6144 1024]
-
blk.12.ffn_down.3.weightF16[16384 6144]
-
blk.12.ffn_up.3.weightF16[6144 16384]
-
blk.12.ffn_gate.4.weightF16[6144 16384]
-
blk.12.ffn_down.4.weightF16[16384 6144]
-
blk.12.ffn_up.4.weightF16[6144 16384]
-
blk.12.ffn_gate.5.weightF16[6144 16384]
-
blk.12.ffn_down.5.weightF16[16384 6144]
-
blk.12.ffn_up.5.weightF16[6144 16384]
-
blk.12.ffn_gate.6.weightF16[6144 16384]
-
blk.12.ffn_down.6.weightF16[16384 6144]
-
blk.12.ffn_up.6.weightF16[6144 16384]
-
blk.12.ffn_gate.7.weightF16[6144 16384]
-
blk.12.ffn_down.7.weightF16[16384 6144]
-
blk.12.ffn_up.7.weightF16[6144 16384]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.13.ffn_gate.0.weightF16[6144 16384]
-
blk.13.ffn_down.0.weightF16[16384 6144]
-
blk.13.ffn_up.0.weightF16[6144 16384]
-
blk.13.ffn_gate.1.weightF16[6144 16384]
-
blk.13.ffn_down.1.weightF16[16384 6144]
-
blk.13.ffn_up.1.weightF16[6144 16384]
-
blk.13.ffn_gate.2.weightF16[6144 16384]
-
blk.13.ffn_down.2.weightF16[16384 6144]
-
blk.13.ffn_up.2.weightF16[6144 16384]
-
blk.13.ffn_gate_inp.weightF16[6144 8]
-
blk.13.attn_k.weightF16[6144 1024]
-
blk.13.attn_output.weightF16[6144 6144]
-
blk.13.attn_q.weightF16[6144 6144]
-
blk.13.attn_v.weightF16[6144 1024]
-
blk.13.ffn_gate.3.weightF16[6144 16384]
-
blk.13.ffn_down.3.weightF16[16384 6144]
-
blk.13.ffn_up.3.weightF16[6144 16384]
-
blk.13.ffn_gate.4.weightF16[6144 16384]
-
blk.13.ffn_down.4.weightF16[16384 6144]
-
blk.13.ffn_up.4.weightF16[6144 16384]
-
blk.13.ffn_gate.5.weightF16[6144 16384]
-
blk.13.ffn_down.5.weightF16[16384 6144]
-
blk.13.ffn_up.5.weightF16[6144 16384]
-
blk.13.ffn_gate.6.weightF16[6144 16384]
-
blk.13.ffn_down.6.weightF16[16384 6144]
-
blk.13.ffn_up.6.weightF16[6144 16384]
-
blk.13.ffn_gate.7.weightF16[6144 16384]
-
blk.13.ffn_down.7.weightF16[16384 6144]
-
blk.13.ffn_up.7.weightF16[6144 16384]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.14.ffn_gate.0.weightF16[6144 16384]
-
blk.14.ffn_down.0.weightF16[16384 6144]
-
blk.14.ffn_up.0.weightF16[6144 16384]
-
blk.14.ffn_gate.1.weightF16[6144 16384]
-
blk.14.ffn_down.1.weightF16[16384 6144]
-
blk.14.ffn_up.1.weightF16[6144 16384]
-
blk.14.ffn_gate.2.weightF16[6144 16384]
-
blk.14.ffn_down.2.weightF16[16384 6144]
-
blk.14.ffn_gate_inp.weightF16[6144 8]
-
blk.14.attn_k.weightF16[6144 1024]
-
blk.14.attn_output.weightF16[6144 6144]
-
blk.14.attn_q.weightF16[6144 6144]
-
blk.14.attn_v.weightF16[6144 1024]
-
blk.14.ffn_up.2.weightF16[6144 16384]
-
blk.14.ffn_gate.3.weightF16[6144 16384]
-
blk.14.ffn_down.3.weightF16[16384 6144]
-
blk.14.ffn_up.3.weightF16[6144 16384]
-
blk.14.ffn_gate.4.weightF16[6144 16384]
-
blk.14.ffn_down.4.weightF16[16384 6144]
-
blk.14.ffn_up.4.weightF16[6144 16384]
-
blk.14.ffn_gate.5.weightF16[6144 16384]
-
blk.14.ffn_down.5.weightF16[16384 6144]
-
blk.14.ffn_up.5.weightF16[6144 16384]
-
blk.14.ffn_gate.6.weightF16[6144 16384]
-
blk.14.ffn_down.6.weightF16[16384 6144]
-
blk.14.ffn_up.6.weightF16[6144 16384]
-
blk.14.ffn_gate.7.weightF16[6144 16384]
-
blk.14.ffn_down.7.weightF16[16384 6144]
-
blk.14.ffn_up.7.weightF16[6144 16384]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.15.ffn_gate.0.weightF16[6144 16384]
-
blk.15.ffn_down.0.weightF16[16384 6144]
-
blk.15.ffn_up.0.weightF16[6144 16384]
-
blk.15.ffn_gate.1.weightF16[6144 16384]
-
blk.15.ffn_down.1.weightF16[16384 6144]
-
blk.15.ffn_up.1.weightF16[6144 16384]
-
blk.15.ffn_gate.2.weightF16[6144 16384]
-
blk.15.ffn_gate_inp.weightF16[6144 8]
-
blk.15.attn_k.weightF16[6144 1024]
-
blk.15.attn_output.weightF16[6144 6144]
-
blk.15.attn_q.weightF16[6144 6144]
-
blk.15.attn_v.weightF16[6144 1024]
-
blk.15.ffn_down.2.weightF16[16384 6144]
-
blk.15.ffn_up.2.weightF16[6144 16384]
-
blk.15.ffn_gate.3.weightF16[6144 16384]
-
blk.15.ffn_down.3.weightF16[16384 6144]
-
blk.15.ffn_up.3.weightF16[6144 16384]
-
blk.15.ffn_gate.4.weightF16[6144 16384]
-
blk.15.ffn_down.4.weightF16[16384 6144]
-
blk.15.ffn_up.4.weightF16[6144 16384]
-
blk.15.ffn_gate.5.weightF16[6144 16384]
-
blk.15.ffn_down.5.weightF16[16384 6144]
-
blk.15.ffn_up.5.weightF16[6144 16384]
-
blk.15.ffn_gate.6.weightF16[6144 16384]
-
blk.15.ffn_down.6.weightF16[16384 6144]
-
blk.15.ffn_up.6.weightF16[6144 16384]
-
blk.15.ffn_gate.7.weightF16[6144 16384]
-
blk.15.ffn_down.7.weightF16[16384 6144]
-
blk.15.ffn_up.7.weightF16[6144 16384]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.16.ffn_gate.0.weightF16[6144 16384]
-
blk.16.ffn_down.0.weightF16[16384 6144]
-
blk.16.ffn_up.0.weightF16[6144 16384]
-
blk.16.ffn_gate.1.weightF16[6144 16384]
-
blk.16.ffn_down.1.weightF16[16384 6144]
-
blk.16.ffn_up.1.weightF16[6144 16384]
-
blk.16.ffn_gate_inp.weightF16[6144 8]
-
blk.16.attn_k.weightF16[6144 1024]
-
blk.16.attn_output.weightF16[6144 6144]
-
blk.16.attn_q.weightF16[6144 6144]
-
blk.16.attn_v.weightF16[6144 1024]
-
blk.16.ffn_gate.2.weightF16[6144 16384]
-
blk.16.ffn_down.2.weightF16[16384 6144]
-
blk.16.ffn_up.2.weightF16[6144 16384]
-
blk.16.ffn_gate.3.weightF16[6144 16384]
-
blk.16.ffn_down.3.weightF16[16384 6144]
-
blk.16.ffn_up.3.weightF16[6144 16384]
-
blk.16.ffn_gate.4.weightF16[6144 16384]
-
blk.16.ffn_down.4.weightF16[16384 6144]
-
blk.16.ffn_up.4.weightF16[6144 16384]
-
blk.16.ffn_gate.5.weightF16[6144 16384]
-
blk.16.ffn_down.5.weightF16[16384 6144]
-
blk.16.ffn_up.5.weightF16[6144 16384]
-
blk.16.ffn_gate.6.weightF16[6144 16384]
-
blk.16.ffn_down.6.weightF16[16384 6144]
-
blk.16.ffn_up.6.weightF16[6144 16384]
-
blk.16.ffn_gate.7.weightF16[6144 16384]
-
blk.16.ffn_down.7.weightF16[16384 6144]
-
blk.16.ffn_up.7.weightF16[6144 16384]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.17.ffn_gate.0.weightF16[6144 16384]
-
blk.17.ffn_down.0.weightF16[16384 6144]
-
blk.17.ffn_up.0.weightF16[6144 16384]
-
blk.17.ffn_gate.1.weightF16[6144 16384]
-
blk.17.ffn_down.1.weightF16[16384 6144]
-
blk.17.ffn_gate_inp.weightF16[6144 8]
-
blk.17.attn_k.weightF16[6144 1024]
-
blk.17.attn_output.weightF16[6144 6144]
-
blk.17.attn_q.weightF16[6144 6144]
-
blk.17.attn_v.weightF16[6144 1024]
-
blk.17.ffn_up.1.weightF16[6144 16384]
-
blk.17.ffn_gate.2.weightF16[6144 16384]
-
blk.17.ffn_down.2.weightF16[16384 6144]
-
blk.17.ffn_up.2.weightF16[6144 16384]
-
blk.17.ffn_gate.3.weightF16[6144 16384]
-
blk.17.ffn_down.3.weightF16[16384 6144]
-
blk.17.ffn_up.3.weightF16[6144 16384]
-
blk.17.ffn_gate.4.weightF16[6144 16384]
-
blk.17.ffn_down.4.weightF16[16384 6144]
-
blk.17.ffn_up.4.weightF16[6144 16384]
-
blk.17.ffn_gate.5.weightF16[6144 16384]
-
blk.17.ffn_down.5.weightF16[16384 6144]
-
blk.17.ffn_up.5.weightF16[6144 16384]
-
blk.17.ffn_gate.6.weightF16[6144 16384]
-
blk.17.ffn_down.6.weightF16[16384 6144]
-
blk.17.ffn_up.6.weightF16[6144 16384]
-
blk.17.ffn_gate.7.weightF16[6144 16384]
-
blk.17.ffn_down.7.weightF16[16384 6144]
-
blk.17.ffn_up.7.weightF16[6144 16384]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.18.ffn_gate.0.weightF16[6144 16384]
-
blk.18.ffn_down.0.weightF16[16384 6144]
-
blk.18.ffn_up.0.weightF16[6144 16384]
-
blk.18.ffn_gate.1.weightF16[6144 16384]
-
blk.18.ffn_gate_inp.weightF16[6144 8]
-
blk.18.attn_k.weightF16[6144 1024]
-
blk.18.attn_output.weightF16[6144 6144]
-
blk.18.attn_q.weightF16[6144 6144]
-
blk.18.attn_v.weightF16[6144 1024]
-
blk.18.ffn_down.1.weightF16[16384 6144]
-
blk.18.ffn_up.1.weightF16[6144 16384]
-
blk.18.ffn_gate.2.weightF16[6144 16384]
-
blk.18.ffn_down.2.weightF16[16384 6144]
-
blk.18.ffn_up.2.weightF16[6144 16384]
-
blk.18.ffn_gate.3.weightF16[6144 16384]
-
blk.18.ffn_down.3.weightF16[16384 6144]
-
blk.18.ffn_up.3.weightF16[6144 16384]
-
blk.18.ffn_gate.4.weightF16[6144 16384]
-
blk.18.ffn_down.4.weightF16[16384 6144]
-
blk.18.ffn_up.4.weightF16[6144 16384]
-
blk.18.ffn_gate.5.weightF16[6144 16384]
-
blk.18.ffn_down.5.weightF16[16384 6144]
-
blk.18.ffn_up.5.weightF16[6144 16384]
-
blk.18.ffn_gate.6.weightF16[6144 16384]
-
blk.18.ffn_down.6.weightF16[16384 6144]
-
blk.18.ffn_up.6.weightF16[6144 16384]
-
blk.18.ffn_gate.7.weightF16[6144 16384]
-
blk.18.ffn_down.7.weightF16[16384 6144]
-
blk.18.ffn_up.7.weightF16[6144 16384]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.19.ffn_gate.0.weightF16[6144 16384]
-
blk.19.ffn_down.0.weightF16[16384 6144]
-
blk.19.ffn_up.0.weightF16[6144 16384]
-
blk.19.ffn_gate_inp.weightF16[6144 8]
-
blk.19.attn_k.weightF16[6144 1024]
-
blk.19.attn_output.weightF16[6144 6144]
-
blk.19.attn_q.weightF16[6144 6144]
-
blk.19.attn_v.weightF16[6144 1024]
-
blk.19.ffn_gate.1.weightF16[6144 16384]
-
blk.19.ffn_down.1.weightF16[16384 6144]
-
blk.19.ffn_up.1.weightF16[6144 16384]
-
blk.19.ffn_gate.2.weightF16[6144 16384]
-
blk.19.ffn_down.2.weightF16[16384 6144]
-
blk.19.ffn_up.2.weightF16[6144 16384]
-
blk.19.ffn_gate.3.weightF16[6144 16384]
-
blk.19.ffn_down.3.weightF16[16384 6144]
-
blk.19.ffn_up.3.weightF16[6144 16384]
-
blk.19.ffn_gate.4.weightF16[6144 16384]
-
blk.19.ffn_down.4.weightF16[16384 6144]
-
blk.19.ffn_up.4.weightF16[6144 16384]
-
blk.19.ffn_gate.5.weightF16[6144 16384]
-
blk.19.ffn_down.5.weightF16[16384 6144]
-
blk.19.ffn_up.5.weightF16[6144 16384]
-
blk.19.ffn_gate.6.weightF16[6144 16384]
-
blk.19.ffn_down.6.weightF16[16384 6144]
-
blk.19.ffn_up.6.weightF16[6144 16384]
-
blk.19.ffn_gate.7.weightF16[6144 16384]
-
blk.19.ffn_down.7.weightF16[16384 6144]
-
blk.19.ffn_up.7.weightF16[6144 16384]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.20.ffn_gate.0.weightF16[6144 16384]
-
blk.20.ffn_down.0.weightF16[16384 6144]
-
blk.20.ffn_gate_inp.weightF16[6144 8]
-
blk.20.attn_k.weightF16[6144 1024]
-
blk.20.attn_output.weightF16[6144 6144]
-
blk.20.attn_q.weightF16[6144 6144]
-
blk.20.attn_v.weightF16[6144 1024]
-
blk.20.ffn_up.0.weightF16[6144 16384]
-
blk.20.ffn_gate.1.weightF16[6144 16384]
-
blk.20.ffn_down.1.weightF16[16384 6144]
-
blk.20.ffn_up.1.weightF16[6144 16384]
-
blk.20.ffn_gate.2.weightF16[6144 16384]
-
blk.20.ffn_down.2.weightF16[16384 6144]
-
blk.20.ffn_up.2.weightF16[6144 16384]
-
blk.20.ffn_gate.3.weightF16[6144 16384]
-
blk.20.ffn_down.3.weightF16[16384 6144]
-
blk.20.ffn_up.3.weightF16[6144 16384]
-
blk.20.ffn_gate.4.weightF16[6144 16384]
-
blk.20.ffn_down.4.weightF16[16384 6144]
-
blk.20.ffn_up.4.weightF16[6144 16384]
-
blk.20.ffn_gate.5.weightF16[6144 16384]
-
blk.20.ffn_down.5.weightF16[16384 6144]
-
blk.20.ffn_up.5.weightF16[6144 16384]
-
blk.20.ffn_gate.6.weightF16[6144 16384]
-
blk.20.ffn_down.6.weightF16[16384 6144]
-
blk.20.ffn_up.6.weightF16[6144 16384]
-
blk.20.ffn_gate.7.weightF16[6144 16384]
-
blk.20.ffn_down.7.weightF16[16384 6144]
-
blk.20.ffn_up.7.weightF16[6144 16384]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.21.ffn_gate.0.weightF16[6144 16384]
-
blk.21.ffn_gate_inp.weightF16[6144 8]
-
blk.21.attn_k.weightF16[6144 1024]
-
blk.21.attn_output.weightF16[6144 6144]
-
blk.21.attn_q.weightF16[6144 6144]
-
blk.21.attn_v.weightF16[6144 1024]
-
blk.21.ffn_down.0.weightF16[16384 6144]
-
blk.21.ffn_up.0.weightF16[6144 16384]
-
blk.21.ffn_gate.1.weightF16[6144 16384]
-
blk.21.ffn_down.1.weightF16[16384 6144]
-
blk.21.ffn_up.1.weightF16[6144 16384]
-
blk.21.ffn_gate.2.weightF16[6144 16384]
-
blk.21.ffn_down.2.weightF16[16384 6144]
-
blk.21.ffn_up.2.weightF16[6144 16384]
-
blk.21.ffn_gate.3.weightF16[6144 16384]
-
blk.21.ffn_down.3.weightF16[16384 6144]
-
blk.21.ffn_up.3.weightF16[6144 16384]
-
blk.21.ffn_gate.4.weightF16[6144 16384]
-
blk.21.ffn_down.4.weightF16[16384 6144]
-
blk.21.ffn_up.4.weightF16[6144 16384]
-
blk.21.ffn_gate.5.weightF16[6144 16384]
-
blk.21.ffn_down.5.weightF16[16384 6144]
-
blk.21.ffn_up.5.weightF16[6144 16384]
-
blk.21.ffn_gate.6.weightF16[6144 16384]
-
blk.21.ffn_down.6.weightF16[16384 6144]
-
blk.21.ffn_up.6.weightF16[6144 16384]
-
blk.21.ffn_gate.7.weightF16[6144 16384]
-
blk.21.ffn_down.7.weightF16[16384 6144]
-
blk.21.ffn_up.7.weightF16[6144 16384]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.22.ffn_gate_inp.weightF16[6144 8]
-
blk.22.attn_k.weightF16[6144 1024]
-
blk.22.attn_output.weightF16[6144 6144]
-
blk.22.attn_q.weightF16[6144 6144]
-
blk.22.attn_v.weightF16[6144 1024]
-
blk.22.ffn_gate.0.weightF16[6144 16384]
-
blk.22.ffn_down.0.weightF16[16384 6144]
-
blk.22.ffn_up.0.weightF16[6144 16384]
-
blk.22.ffn_gate.1.weightF16[6144 16384]
-
blk.22.ffn_down.1.weightF16[16384 6144]
-
blk.22.ffn_up.1.weightF16[6144 16384]
-
blk.22.ffn_gate.2.weightF16[6144 16384]
-
blk.22.ffn_down.2.weightF16[16384 6144]
-
blk.22.ffn_up.2.weightF16[6144 16384]
-
blk.22.ffn_gate.3.weightF16[6144 16384]
-
blk.22.ffn_down.3.weightF16[16384 6144]
-
blk.22.ffn_up.3.weightF16[6144 16384]
-
blk.22.ffn_gate.4.weightF16[6144 16384]
-
blk.22.ffn_down.4.weightF16[16384 6144]
-
blk.22.ffn_up.4.weightF16[6144 16384]
-
blk.22.ffn_gate.5.weightF16[6144 16384]
-
blk.22.ffn_down.5.weightF16[16384 6144]
-
blk.22.ffn_up.5.weightF16[6144 16384]
-
blk.22.ffn_gate.6.weightF16[6144 16384]
-
blk.22.ffn_down.6.weightF16[16384 6144]
-
blk.22.ffn_up.6.weightF16[6144 16384]
-
blk.22.ffn_gate.7.weightF16[6144 16384]
-
blk.22.ffn_down.7.weightF16[16384 6144]
-
blk.22.ffn_up.7.weightF16[6144 16384]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.23.attn_k.weightF16[6144 1024]
-
blk.23.attn_q.weightF16[6144 6144]
-
blk.23.attn_v.weightF16[6144 1024]
-
blk.23.ffn_gate.0.weightF16[6144 16384]
-
blk.23.ffn_down.0.weightF16[16384 6144]
-
blk.23.ffn_up.0.weightF16[6144 16384]
-
blk.23.ffn_gate.1.weightF16[6144 16384]
-
blk.23.ffn_down.1.weightF16[16384 6144]
-
blk.23.ffn_up.1.weightF16[6144 16384]
-
blk.23.ffn_gate.2.weightF16[6144 16384]
-
blk.23.ffn_down.2.weightF16[16384 6144]
-
blk.23.ffn_up.2.weightF16[6144 16384]
-
blk.23.ffn_gate.3.weightF16[6144 16384]
-
blk.23.ffn_down.3.weightF16[16384 6144]
-
blk.23.ffn_up.3.weightF16[6144 16384]
-
blk.23.ffn_gate.4.weightF16[6144 16384]
-
blk.23.ffn_down.4.weightF16[16384 6144]
-
blk.23.ffn_up.4.weightF16[6144 16384]
-
blk.23.ffn_gate.5.weightF16[6144 16384]
-
blk.23.ffn_down.5.weightF16[16384 6144]
-
blk.23.ffn_up.5.weightF16[6144 16384]
-
blk.23.ffn_gate.6.weightF16[6144 16384]
-
blk.23.ffn_down.6.weightF16[16384 6144]
-
blk.23.ffn_up.6.weightF16[6144 16384]
-
blk.23.ffn_gate.7.weightF16[6144 16384]
-
blk.23.ffn_down.7.weightF16[16384 6144]
-
blk.23.ffn_up.7.weightF16[6144 16384]
-
blk.23.ffn_gate_inp.weightF16[6144 8]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.attn_output.weightF16[6144 6144]
-
blk.24.attn_k.weightF16[6144 1024]
-
blk.24.attn_q.weightF16[6144 6144]
-
blk.24.ffn_gate.0.weightF16[6144 16384]
-
blk.24.ffn_down.0.weightF16[16384 6144]
-
blk.24.ffn_up.0.weightF16[6144 16384]
-
blk.24.ffn_gate.1.weightF16[6144 16384]
-
blk.24.ffn_down.1.weightF16[16384 6144]
-
blk.24.ffn_up.1.weightF16[6144 16384]
-
blk.24.ffn_gate.2.weightF16[6144 16384]
-
blk.24.ffn_down.2.weightF16[16384 6144]
-
blk.24.ffn_up.2.weightF16[6144 16384]
-
blk.24.ffn_gate.3.weightF16[6144 16384]
-
blk.24.ffn_down.3.weightF16[16384 6144]
-
blk.24.ffn_up.3.weightF16[6144 16384]
-
blk.24.ffn_gate.4.weightF16[6144 16384]
-
blk.24.ffn_down.4.weightF16[16384 6144]
-
blk.24.ffn_up.4.weightF16[6144 16384]
-
blk.24.ffn_gate.5.weightF16[6144 16384]
-
blk.24.ffn_down.5.weightF16[16384 6144]
-
blk.24.ffn_up.5.weightF16[6144 16384]
-
blk.24.ffn_gate.6.weightF16[6144 16384]
-
blk.24.ffn_down.6.weightF16[16384 6144]
-
blk.24.ffn_up.6.weightF16[6144 16384]
-
blk.24.ffn_gate.7.weightF16[6144 16384]
-
blk.24.ffn_down.7.weightF16[16384 6144]
-
blk.24.ffn_up.7.weightF16[6144 16384]
-
blk.24.ffn_gate_inp.weightF16[6144 8]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.24.attn_output.weightF16[6144 6144]
-
blk.24.attn_v.weightF16[6144 1024]
-
blk.25.attn_q.weightF16[6144 6144]
-
blk.25.ffn_gate.0.weightF16[6144 16384]
-
blk.25.ffn_down.0.weightF16[16384 6144]
-
blk.25.ffn_up.0.weightF16[6144 16384]
-
blk.25.ffn_gate.1.weightF16[6144 16384]
-
blk.25.ffn_down.1.weightF16[16384 6144]
-
blk.25.ffn_up.1.weightF16[6144 16384]
-
blk.25.ffn_gate.2.weightF16[6144 16384]
-
blk.25.ffn_down.2.weightF16[16384 6144]
-
blk.25.ffn_up.2.weightF16[6144 16384]
-
blk.25.ffn_gate.3.weightF16[6144 16384]
-
blk.25.ffn_down.3.weightF16[16384 6144]
-
blk.25.ffn_up.3.weightF16[6144 16384]
-
blk.25.ffn_gate.4.weightF16[6144 16384]
-
blk.25.ffn_down.4.weightF16[16384 6144]
-
blk.25.ffn_up.4.weightF16[6144 16384]
-
blk.25.ffn_gate.5.weightF16[6144 16384]
-
blk.25.ffn_down.5.weightF16[16384 6144]
-
blk.25.ffn_up.5.weightF16[6144 16384]
-
blk.25.ffn_gate.6.weightF16[6144 16384]
-
blk.25.ffn_down.6.weightF16[16384 6144]
-
blk.25.ffn_up.6.weightF16[6144 16384]
-
blk.25.ffn_gate.7.weightF16[6144 16384]
-
blk.25.ffn_down.7.weightF16[16384 6144]
-
blk.25.ffn_up.7.weightF16[6144 16384]
-
blk.25.ffn_gate_inp.weightF16[6144 8]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.attn_k.weightF16[6144 1024]
-
blk.25.attn_output.weightF16[6144 6144]
-
blk.25.attn_v.weightF16[6144 1024]
-
blk.26.ffn_gate.0.weightF16[6144 16384]
-
blk.26.ffn_down.0.weightF16[16384 6144]
-
blk.26.ffn_up.0.weightF16[6144 16384]
-
blk.26.ffn_gate.1.weightF16[6144 16384]
-
blk.26.ffn_down.1.weightF16[16384 6144]
-
blk.26.ffn_up.1.weightF16[6144 16384]
-
blk.26.ffn_gate.2.weightF16[6144 16384]
-
blk.26.ffn_down.2.weightF16[16384 6144]
-
blk.26.ffn_up.2.weightF16[6144 16384]
-
blk.26.ffn_gate.3.weightF16[6144 16384]
-
blk.26.ffn_down.3.weightF16[16384 6144]
-
blk.26.ffn_up.3.weightF16[6144 16384]
-
blk.26.ffn_gate.4.weightF16[6144 16384]
-
blk.26.ffn_down.4.weightF16[16384 6144]
-
blk.26.ffn_up.4.weightF16[6144 16384]
-
blk.26.ffn_gate.5.weightF16[6144 16384]
-
blk.26.ffn_down.5.weightF16[16384 6144]
-
blk.26.ffn_up.5.weightF16[6144 16384]
-
blk.26.ffn_gate.6.weightF16[6144 16384]
-
blk.26.ffn_down.6.weightF16[16384 6144]
-
blk.26.ffn_up.6.weightF16[6144 16384]
-
blk.26.ffn_gate.7.weightF16[6144 16384]
-
blk.26.ffn_down.7.weightF16[16384 6144]
-
blk.26.ffn_gate_inp.weightF16[6144 8]
-
blk.26.attn_k.weightF16[6144 1024]
-
blk.26.attn_output.weightF16[6144 6144]
-
blk.26.attn_q.weightF16[6144 6144]
-
blk.26.attn_v.weightF16[6144 1024]
-
blk.26.ffn_up.7.weightF16[6144 16384]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.27.ffn_gate.0.weightF16[6144 16384]
-
blk.27.ffn_down.0.weightF16[16384 6144]
-
blk.27.ffn_up.0.weightF16[6144 16384]
-
blk.27.ffn_gate.1.weightF16[6144 16384]
-
blk.27.ffn_down.1.weightF16[16384 6144]
-
blk.27.ffn_up.1.weightF16[6144 16384]
-
blk.27.ffn_gate.2.weightF16[6144 16384]
-
blk.27.ffn_down.2.weightF16[16384 6144]
-
blk.27.ffn_up.2.weightF16[6144 16384]
-
blk.27.ffn_gate.3.weightF16[6144 16384]
-
blk.27.ffn_down.3.weightF16[16384 6144]
-
blk.27.ffn_up.3.weightF16[6144 16384]
-
blk.27.ffn_gate.4.weightF16[6144 16384]
-
blk.27.ffn_down.4.weightF16[16384 6144]
-
blk.27.ffn_up.4.weightF16[6144 16384]
-
blk.27.ffn_gate.5.weightF16[6144 16384]
-
blk.27.ffn_down.5.weightF16[16384 6144]
-
blk.27.ffn_up.5.weightF16[6144 16384]
-
blk.27.ffn_gate.6.weightF16[6144 16384]
-
blk.27.ffn_down.6.weightF16[16384 6144]
-
blk.27.ffn_up.6.weightF16[6144 16384]
-
blk.27.ffn_gate.7.weightF16[6144 16384]
-
blk.27.ffn_gate_inp.weightF16[6144 8]
-
blk.27.attn_k.weightF16[6144 1024]
-
blk.27.attn_output.weightF16[6144 6144]
-
blk.27.attn_q.weightF16[6144 6144]
-
blk.27.attn_v.weightF16[6144 1024]
-
blk.27.ffn_down.7.weightF16[16384 6144]
-
blk.27.ffn_up.7.weightF16[6144 16384]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.28.ffn_gate.0.weightF16[6144 16384]
-
blk.28.ffn_down.0.weightF16[16384 6144]
-
blk.28.ffn_up.0.weightF16[6144 16384]
-
blk.28.ffn_gate.1.weightF16[6144 16384]
-
blk.28.ffn_down.1.weightF16[16384 6144]
-
blk.28.ffn_up.1.weightF16[6144 16384]
-
blk.28.ffn_gate.2.weightF16[6144 16384]
-
blk.28.ffn_down.2.weightF16[16384 6144]
-
blk.28.ffn_up.2.weightF16[6144 16384]
-
blk.28.ffn_gate.3.weightF16[6144 16384]
-
blk.28.ffn_down.3.weightF16[16384 6144]
-
blk.28.ffn_up.3.weightF16[6144 16384]
-
blk.28.ffn_gate.4.weightF16[6144 16384]
-
blk.28.ffn_down.4.weightF16[16384 6144]
-
blk.28.ffn_up.4.weightF16[6144 16384]
-
blk.28.ffn_gate.5.weightF16[6144 16384]
-
blk.28.ffn_down.5.weightF16[16384 6144]
-
blk.28.ffn_up.5.weightF16[6144 16384]
-
blk.28.ffn_gate.6.weightF16[6144 16384]
-
blk.28.ffn_down.6.weightF16[16384 6144]
-
blk.28.ffn_up.6.weightF16[6144 16384]
-
blk.28.ffn_gate_inp.weightF16[6144 8]
-
blk.28.attn_k.weightF16[6144 1024]
-
blk.28.attn_output.weightF16[6144 6144]
-
blk.28.attn_q.weightF16[6144 6144]
-
blk.28.attn_v.weightF16[6144 1024]
-
blk.28.ffn_gate.7.weightF16[6144 16384]
-
blk.28.ffn_down.7.weightF16[16384 6144]
-
blk.28.ffn_up.7.weightF16[6144 16384]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.29.ffn_gate.0.weightF16[6144 16384]
-
blk.29.ffn_down.0.weightF16[16384 6144]
-
blk.29.ffn_up.0.weightF16[6144 16384]
-
blk.29.ffn_gate.1.weightF16[6144 16384]
-
blk.29.ffn_down.1.weightF16[16384 6144]
-
blk.29.ffn_up.1.weightF16[6144 16384]
-
blk.29.ffn_gate.2.weightF16[6144 16384]
-
blk.29.ffn_down.2.weightF16[16384 6144]
-
blk.29.ffn_up.2.weightF16[6144 16384]
-
blk.29.ffn_gate.3.weightF16[6144 16384]
-
blk.29.ffn_down.3.weightF16[16384 6144]
-
blk.29.ffn_up.3.weightF16[6144 16384]
-
blk.29.ffn_gate.4.weightF16[6144 16384]
-
blk.29.ffn_down.4.weightF16[16384 6144]
-
blk.29.ffn_up.4.weightF16[6144 16384]
-
blk.29.ffn_gate.5.weightF16[6144 16384]
-
blk.29.ffn_down.5.weightF16[16384 6144]
-
blk.29.ffn_up.5.weightF16[6144 16384]
-
blk.29.ffn_gate.6.weightF16[6144 16384]
-
blk.29.ffn_down.6.weightF16[16384 6144]
-
blk.29.ffn_gate_inp.weightF16[6144 8]
-
blk.29.attn_k.weightF16[6144 1024]
-
blk.29.attn_output.weightF16[6144 6144]
-
blk.29.attn_q.weightF16[6144 6144]
-
blk.29.attn_v.weightF16[6144 1024]
-
blk.29.ffn_up.6.weightF16[6144 16384]
-
blk.29.ffn_gate.7.weightF16[6144 16384]
-
blk.29.ffn_down.7.weightF16[16384 6144]
-
blk.29.ffn_up.7.weightF16[6144 16384]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.30.ffn_gate.0.weightF16[6144 16384]
-
blk.30.ffn_down.0.weightF16[16384 6144]
-
blk.30.ffn_up.0.weightF16[6144 16384]
-
blk.30.ffn_gate.1.weightF16[6144 16384]
-
blk.30.ffn_down.1.weightF16[16384 6144]
-
blk.30.ffn_up.1.weightF16[6144 16384]
-
blk.30.ffn_gate.2.weightF16[6144 16384]
-
blk.30.ffn_down.2.weightF16[16384 6144]
-
blk.30.ffn_up.2.weightF16[6144 16384]
-
blk.30.ffn_gate.3.weightF16[6144 16384]
-
blk.30.ffn_down.3.weightF16[16384 6144]
-
blk.30.ffn_up.3.weightF16[6144 16384]
-
blk.30.ffn_gate.4.weightF16[6144 16384]
-
blk.30.ffn_down.4.weightF16[16384 6144]
-
blk.30.ffn_up.4.weightF16[6144 16384]
-
blk.30.ffn_gate.5.weightF16[6144 16384]
-
blk.30.ffn_down.5.weightF16[16384 6144]
-
blk.30.ffn_up.5.weightF16[6144 16384]
-
blk.30.ffn_gate.6.weightF16[6144 16384]
-
blk.30.ffn_gate_inp.weightF16[6144 8]
-
blk.30.attn_k.weightF16[6144 1024]
-
blk.30.attn_output.weightF16[6144 6144]
-
blk.30.attn_q.weightF16[6144 6144]
-
blk.30.attn_v.weightF16[6144 1024]
-
blk.30.ffn_down.6.weightF16[16384 6144]
-
blk.30.ffn_up.6.weightF16[6144 16384]
-
blk.30.ffn_gate.7.weightF16[6144 16384]
-
blk.30.ffn_down.7.weightF16[16384 6144]
-
blk.30.ffn_up.7.weightF16[6144 16384]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.31.ffn_gate.0.weightF16[6144 16384]
-
blk.31.ffn_down.0.weightF16[16384 6144]
-
blk.31.ffn_up.0.weightF16[6144 16384]
-
blk.31.ffn_gate.1.weightF16[6144 16384]
-
blk.31.ffn_down.1.weightF16[16384 6144]
-
blk.31.ffn_up.1.weightF16[6144 16384]
-
blk.31.ffn_gate.2.weightF16[6144 16384]
-
blk.31.ffn_down.2.weightF16[16384 6144]
-
blk.31.ffn_up.2.weightF16[6144 16384]
-
blk.31.ffn_gate.3.weightF16[6144 16384]
-
blk.31.ffn_down.3.weightF16[16384 6144]
-
blk.31.ffn_up.3.weightF16[6144 16384]
-
blk.31.ffn_gate.4.weightF16[6144 16384]
-
blk.31.ffn_down.4.weightF16[16384 6144]
-
blk.31.ffn_up.4.weightF16[6144 16384]
-
blk.31.ffn_gate.5.weightF16[6144 16384]
-
blk.31.ffn_down.5.weightF16[16384 6144]
-
blk.31.ffn_up.5.weightF16[6144 16384]
-
blk.31.ffn_gate_inp.weightF16[6144 8]
-
blk.31.attn_k.weightF16[6144 1024]
-
blk.31.attn_output.weightF16[6144 6144]
-
blk.31.attn_q.weightF16[6144 6144]
-
blk.31.attn_v.weightF16[6144 1024]
-
blk.31.ffn_gate.6.weightF16[6144 16384]
-
blk.31.ffn_down.6.weightF16[16384 6144]
-
blk.31.ffn_up.6.weightF16[6144 16384]
-
blk.31.ffn_gate.7.weightF16[6144 16384]
-
blk.31.ffn_down.7.weightF16[16384 6144]
-
blk.31.ffn_up.7.weightF16[6144 16384]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.32.ffn_gate.0.weightF16[6144 16384]
-
blk.32.ffn_down.0.weightF16[16384 6144]
-
blk.32.ffn_up.0.weightF16[6144 16384]
-
blk.32.ffn_gate.1.weightF16[6144 16384]
-
blk.32.ffn_down.1.weightF16[16384 6144]
-
blk.32.ffn_up.1.weightF16[6144 16384]
-
blk.32.ffn_gate.2.weightF16[6144 16384]
-
blk.32.ffn_down.2.weightF16[16384 6144]
-
blk.32.ffn_up.2.weightF16[6144 16384]
-
blk.32.ffn_gate.3.weightF16[6144 16384]
-
blk.32.ffn_down.3.weightF16[16384 6144]
-
blk.32.ffn_up.3.weightF16[6144 16384]
-
blk.32.ffn_gate.4.weightF16[6144 16384]
-
blk.32.ffn_down.4.weightF16[16384 6144]
-
blk.32.ffn_up.4.weightF16[6144 16384]
-
blk.32.ffn_gate.5.weightF16[6144 16384]
-
blk.32.ffn_down.5.weightF16[16384 6144]
-
blk.32.ffn_gate_inp.weightF16[6144 8]
-
blk.32.attn_k.weightF16[6144 1024]
-
blk.32.attn_output.weightF16[6144 6144]
-
blk.32.attn_q.weightF16[6144 6144]
-
blk.32.attn_v.weightF16[6144 1024]
-
blk.32.ffn_up.5.weightF16[6144 16384]
-
blk.32.ffn_gate.6.weightF16[6144 16384]
-
blk.32.ffn_down.6.weightF16[16384 6144]
-
blk.32.ffn_up.6.weightF16[6144 16384]
-
blk.32.ffn_gate.7.weightF16[6144 16384]
-
blk.32.ffn_down.7.weightF16[16384 6144]
-
blk.32.ffn_up.7.weightF16[6144 16384]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.33.ffn_gate.0.weightF16[6144 16384]
-
blk.33.ffn_down.0.weightF16[16384 6144]
-
blk.33.ffn_up.0.weightF16[6144 16384]
-
blk.33.ffn_gate.1.weightF16[6144 16384]
-
blk.33.ffn_down.1.weightF16[16384 6144]
-
blk.33.ffn_up.1.weightF16[6144 16384]
-
blk.33.ffn_gate.2.weightF16[6144 16384]
-
blk.33.ffn_down.2.weightF16[16384 6144]
-
blk.33.ffn_up.2.weightF16[6144 16384]
-
blk.33.ffn_gate.3.weightF16[6144 16384]
-
blk.33.ffn_down.3.weightF16[16384 6144]
-
blk.33.ffn_up.3.weightF16[6144 16384]
-
blk.33.ffn_gate.4.weightF16[6144 16384]
-
blk.33.ffn_down.4.weightF16[16384 6144]
-
blk.33.ffn_up.4.weightF16[6144 16384]
-
blk.33.ffn_gate.5.weightF16[6144 16384]
-
blk.33.ffn_gate_inp.weightF16[6144 8]
-
blk.33.attn_k.weightF16[6144 1024]
-
blk.33.attn_output.weightF16[6144 6144]
-
blk.33.attn_q.weightF16[6144 6144]
-
blk.33.attn_v.weightF16[6144 1024]
-
blk.33.ffn_down.5.weightF16[16384 6144]
-
blk.33.ffn_up.5.weightF16[6144 16384]
-
blk.33.ffn_gate.6.weightF16[6144 16384]
-
blk.33.ffn_down.6.weightF16[16384 6144]
-
blk.33.ffn_up.6.weightF16[6144 16384]
-
blk.33.ffn_gate.7.weightF16[6144 16384]
-
blk.33.ffn_down.7.weightF16[16384 6144]
-
blk.33.ffn_up.7.weightF16[6144 16384]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.34.ffn_gate.0.weightF16[6144 16384]
-
blk.34.ffn_down.0.weightF16[16384 6144]
-
blk.34.ffn_up.0.weightF16[6144 16384]
-
blk.34.ffn_gate.1.weightF16[6144 16384]
-
blk.34.ffn_down.1.weightF16[16384 6144]
-
blk.34.ffn_up.1.weightF16[6144 16384]
-
blk.34.ffn_gate.2.weightF16[6144 16384]
-
blk.34.ffn_down.2.weightF16[16384 6144]
-
blk.34.ffn_up.2.weightF16[6144 16384]
-
blk.34.ffn_gate.3.weightF16[6144 16384]
-
blk.34.ffn_down.3.weightF16[16384 6144]
-
blk.34.ffn_up.3.weightF16[6144 16384]
-
blk.34.ffn_gate.4.weightF16[6144 16384]
-
blk.34.ffn_down.4.weightF16[16384 6144]
-
blk.34.ffn_up.4.weightF16[6144 16384]
-
blk.34.ffn_gate_inp.weightF16[6144 8]
-
blk.34.attn_k.weightF16[6144 1024]
-
blk.34.attn_output.weightF16[6144 6144]
-
blk.34.attn_q.weightF16[6144 6144]
-
blk.34.attn_v.weightF16[6144 1024]
-
blk.34.ffn_gate.5.weightF16[6144 16384]
-
blk.34.ffn_down.5.weightF16[16384 6144]
-
blk.34.ffn_up.5.weightF16[6144 16384]
-
blk.34.ffn_gate.6.weightF16[6144 16384]
-
blk.34.ffn_down.6.weightF16[16384 6144]
-
blk.34.ffn_up.6.weightF16[6144 16384]
-
blk.34.ffn_gate.7.weightF16[6144 16384]
-
blk.34.ffn_down.7.weightF16[16384 6144]
-
blk.34.ffn_up.7.weightF16[6144 16384]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.35.ffn_gate.0.weightF16[6144 16384]
-
blk.35.ffn_down.0.weightF16[16384 6144]
-
blk.35.ffn_up.0.weightF16[6144 16384]
-
blk.35.ffn_gate.1.weightF16[6144 16384]
-
blk.35.ffn_down.1.weightF16[16384 6144]
-
blk.35.ffn_up.1.weightF16[6144 16384]
-
blk.35.ffn_gate.2.weightF16[6144 16384]
-
blk.35.ffn_down.2.weightF16[16384 6144]
-
blk.35.ffn_up.2.weightF16[6144 16384]
-
blk.35.ffn_gate.3.weightF16[6144 16384]
-
blk.35.ffn_down.3.weightF16[16384 6144]
-
blk.35.ffn_up.3.weightF16[6144 16384]
-
blk.35.ffn_gate.4.weightF16[6144 16384]
-
blk.35.ffn_down.4.weightF16[16384 6144]
-
blk.35.ffn_gate_inp.weightF16[6144 8]
-
blk.35.attn_k.weightF16[6144 1024]
-
blk.35.attn_output.weightF16[6144 6144]
-
blk.35.attn_q.weightF16[6144 6144]
-
blk.35.attn_v.weightF16[6144 1024]
-
blk.35.ffn_up.4.weightF16[6144 16384]
-
blk.35.ffn_gate.5.weightF16[6144 16384]
-
blk.35.ffn_down.5.weightF16[16384 6144]
-
blk.35.ffn_up.5.weightF16[6144 16384]
-
blk.35.ffn_gate.6.weightF16[6144 16384]
-
blk.35.ffn_down.6.weightF16[16384 6144]
-
blk.35.ffn_up.6.weightF16[6144 16384]
-
blk.35.ffn_gate.7.weightF16[6144 16384]
-
blk.35.ffn_down.7.weightF16[16384 6144]
-
blk.35.ffn_up.7.weightF16[6144 16384]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.36.ffn_gate.0.weightF16[6144 16384]
-
blk.36.ffn_down.0.weightF16[16384 6144]
-
blk.36.ffn_up.0.weightF16[6144 16384]
-
blk.36.ffn_gate.1.weightF16[6144 16384]
-
blk.36.ffn_down.1.weightF16[16384 6144]
-
blk.36.ffn_up.1.weightF16[6144 16384]
-
blk.36.ffn_gate.2.weightF16[6144 16384]
-
blk.36.ffn_down.2.weightF16[16384 6144]
-
blk.36.ffn_up.2.weightF16[6144 16384]
-
blk.36.ffn_gate.3.weightF16[6144 16384]
-
blk.36.ffn_down.3.weightF16[16384 6144]
-
blk.36.ffn_up.3.weightF16[6144 16384]
-
blk.36.ffn_gate.4.weightF16[6144 16384]
-
blk.36.ffn_gate_inp.weightF16[6144 8]
-
blk.36.attn_k.weightF16[6144 1024]
-
blk.36.attn_output.weightF16[6144 6144]
-
blk.36.attn_q.weightF16[6144 6144]
-
blk.36.attn_v.weightF16[6144 1024]
-
blk.36.ffn_down.4.weightF16[16384 6144]
-
blk.36.ffn_up.4.weightF16[6144 16384]
-
blk.36.ffn_gate.5.weightF16[6144 16384]
-
blk.36.ffn_down.5.weightF16[16384 6144]
-
blk.36.ffn_up.5.weightF16[6144 16384]
-
blk.36.ffn_gate.6.weightF16[6144 16384]
-
blk.36.ffn_down.6.weightF16[16384 6144]
-
blk.36.ffn_up.6.weightF16[6144 16384]
-
blk.36.ffn_gate.7.weightF16[6144 16384]
-
blk.36.ffn_down.7.weightF16[16384 6144]
-
blk.36.ffn_up.7.weightF16[6144 16384]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.37.ffn_gate.0.weightF16[6144 16384]
-
blk.37.ffn_down.0.weightF16[16384 6144]
-
blk.37.ffn_up.0.weightF16[6144 16384]
-
blk.37.ffn_gate.1.weightF16[6144 16384]
-
blk.37.ffn_down.1.weightF16[16384 6144]
-
blk.37.ffn_up.1.weightF16[6144 16384]
-
blk.37.ffn_gate.2.weightF16[6144 16384]
-
blk.37.ffn_down.2.weightF16[16384 6144]
-
blk.37.ffn_up.2.weightF16[6144 16384]
-
blk.37.ffn_gate.3.weightF16[6144 16384]
-
blk.37.ffn_down.3.weightF16[16384 6144]
-
blk.37.ffn_up.3.weightF16[6144 16384]
-
blk.37.ffn_gate_inp.weightF16[6144 8]
-
blk.37.attn_k.weightF16[6144 1024]
-
blk.37.attn_output.weightF16[6144 6144]
-
blk.37.attn_q.weightF16[6144 6144]
-
blk.37.attn_v.weightF16[6144 1024]
-
blk.37.ffn_gate.4.weightF16[6144 16384]
-
blk.37.ffn_down.4.weightF16[16384 6144]
-
blk.37.ffn_up.4.weightF16[6144 16384]
-
blk.37.ffn_gate.5.weightF16[6144 16384]
-
blk.37.ffn_down.5.weightF16[16384 6144]
-
blk.37.ffn_up.5.weightF16[6144 16384]
-
blk.37.ffn_gate.6.weightF16[6144 16384]
-
blk.37.ffn_down.6.weightF16[16384 6144]
-
blk.37.ffn_up.6.weightF16[6144 16384]
-
blk.37.ffn_gate.7.weightF16[6144 16384]
-
blk.37.ffn_down.7.weightF16[16384 6144]
-
blk.37.ffn_up.7.weightF16[6144 16384]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.38.ffn_gate.0.weightF16[6144 16384]
-
blk.38.ffn_down.0.weightF16[16384 6144]
-
blk.38.ffn_up.0.weightF16[6144 16384]
-
blk.38.ffn_gate.1.weightF16[6144 16384]
-
blk.38.ffn_down.1.weightF16[16384 6144]
-
blk.38.ffn_up.1.weightF16[6144 16384]
-
blk.38.ffn_gate.2.weightF16[6144 16384]
-
blk.38.ffn_down.2.weightF16[16384 6144]
-
blk.38.ffn_up.2.weightF16[6144 16384]
-
blk.38.ffn_gate.3.weightF16[6144 16384]
-
blk.38.ffn_down.3.weightF16[16384 6144]
-
blk.38.ffn_gate_inp.weightF16[6144 8]
-
blk.38.attn_k.weightF16[6144 1024]
-
blk.38.attn_output.weightF16[6144 6144]
-
blk.38.attn_q.weightF16[6144 6144]
-
blk.38.attn_v.weightF16[6144 1024]
-
blk.38.ffn_up.3.weightF16[6144 16384]
-
blk.38.ffn_gate.4.weightF16[6144 16384]
-
blk.38.ffn_down.4.weightF16[16384 6144]
-
blk.38.ffn_up.4.weightF16[6144 16384]
-
blk.38.ffn_gate.5.weightF16[6144 16384]
-
blk.38.ffn_down.5.weightF16[16384 6144]
-
blk.38.ffn_up.5.weightF16[6144 16384]
-
blk.38.ffn_gate.6.weightF16[6144 16384]
-
blk.38.ffn_down.6.weightF16[16384 6144]
-
blk.38.ffn_up.6.weightF16[6144 16384]
-
blk.38.ffn_gate.7.weightF16[6144 16384]
-
blk.38.ffn_down.7.weightF16[16384 6144]
-
blk.38.ffn_up.7.weightF16[6144 16384]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.39.ffn_gate.0.weightF16[6144 16384]
-
blk.39.ffn_down.0.weightF16[16384 6144]
-
blk.39.ffn_up.0.weightF16[6144 16384]
-
blk.39.ffn_gate.1.weightF16[6144 16384]
-
blk.39.ffn_down.1.weightF16[16384 6144]
-
blk.39.ffn_up.1.weightF16[6144 16384]
-
blk.39.ffn_gate.2.weightF16[6144 16384]
-
blk.39.ffn_down.2.weightF16[16384 6144]
-
blk.39.ffn_up.2.weightF16[6144 16384]
-
blk.39.ffn_gate.3.weightF16[6144 16384]
-
blk.39.ffn_gate_inp.weightF16[6144 8]
-
blk.39.attn_k.weightF16[6144 1024]
-
blk.39.attn_output.weightF16[6144 6144]
-
blk.39.attn_q.weightF16[6144 6144]
-
blk.39.attn_v.weightF16[6144 1024]
-
blk.39.ffn_down.3.weightF16[16384 6144]
-
blk.39.ffn_up.3.weightF16[6144 16384]
-
blk.39.ffn_gate.4.weightF16[6144 16384]
-
blk.39.ffn_down.4.weightF16[16384 6144]
-
blk.39.ffn_up.4.weightF16[6144 16384]
-
blk.39.ffn_gate.5.weightF16[6144 16384]
-
blk.39.ffn_down.5.weightF16[16384 6144]
-
blk.39.ffn_up.5.weightF16[6144 16384]
-
blk.39.ffn_gate.6.weightF16[6144 16384]
-
blk.39.ffn_down.6.weightF16[16384 6144]
-
blk.39.ffn_up.6.weightF16[6144 16384]
-
blk.39.ffn_gate.7.weightF16[6144 16384]
-
blk.39.ffn_down.7.weightF16[16384 6144]
-
blk.39.ffn_up.7.weightF16[6144 16384]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.40.ffn_gate.0.weightF16[6144 16384]
-
blk.40.ffn_down.0.weightF16[16384 6144]
-
blk.40.ffn_up.0.weightF16[6144 16384]
-
blk.40.ffn_gate.1.weightF16[6144 16384]
-
blk.40.ffn_down.1.weightF16[16384 6144]
-
blk.40.ffn_up.1.weightF16[6144 16384]
-
blk.40.ffn_gate.2.weightF16[6144 16384]
-
blk.40.ffn_down.2.weightF16[16384 6144]
-
blk.40.ffn_up.2.weightF16[6144 16384]
-
blk.40.ffn_gate_inp.weightF16[6144 8]
-
blk.40.attn_k.weightF16[6144 1024]
-
blk.40.attn_output.weightF16[6144 6144]
-
blk.40.attn_q.weightF16[6144 6144]
-
blk.40.attn_v.weightF16[6144 1024]
-
blk.40.ffn_gate.3.weightF16[6144 16384]
-
blk.40.ffn_down.3.weightF16[16384 6144]
-
blk.40.ffn_up.3.weightF16[6144 16384]
-
blk.40.ffn_gate.4.weightF16[6144 16384]
-
blk.40.ffn_down.4.weightF16[16384 6144]
-
blk.40.ffn_up.4.weightF16[6144 16384]
-
blk.40.ffn_gate.5.weightF16[6144 16384]
-
blk.40.ffn_down.5.weightF16[16384 6144]
-
blk.40.ffn_up.5.weightF16[6144 16384]
-
blk.40.ffn_gate.6.weightF16[6144 16384]
-
blk.40.ffn_down.6.weightF16[16384 6144]
-
blk.40.ffn_up.6.weightF16[6144 16384]
-
blk.40.ffn_gate.7.weightF16[6144 16384]
-
blk.40.ffn_down.7.weightF16[16384 6144]
-
blk.40.ffn_up.7.weightF16[6144 16384]
-
blk.40.attn_norm.weightF32[6144]
-
blk.40.ffn_norm.weightF32[6144]
-
blk.41.ffn_gate.0.weightF16[6144 16384]
-
blk.41.ffn_down.0.weightF16[16384 6144]
-
blk.41.ffn_up.0.weightF16[6144 16384]
-
blk.41.ffn_gate.1.weightF16[6144 16384]
-
blk.41.ffn_down.1.weightF16[16384 6144]
-
blk.41.ffn_up.1.weightF16[6144 16384]
-
blk.41.ffn_gate.2.weightF16[6144 16384]
-
blk.41.ffn_down.2.weightF16[16384 6144]
-
blk.41.ffn_gate_inp.weightF16[6144 8]
-
blk.41.attn_k.weightF16[6144 1024]
-
blk.41.attn_output.weightF16[6144 6144]
-
blk.41.attn_q.weightF16[6144 6144]
-
blk.41.attn_v.weightF16[6144 1024]
-
blk.41.ffn_up.2.weightF16[6144 16384]
-
blk.41.ffn_gate.3.weightF16[6144 16384]
-
blk.41.ffn_down.3.weightF16[16384 6144]
-
blk.41.ffn_up.3.weightF16[6144 16384]
-
blk.41.ffn_gate.4.weightF16[6144 16384]
-
blk.41.ffn_down.4.weightF16[16384 6144]
-
blk.41.ffn_up.4.weightF16[6144 16384]
-
blk.41.ffn_gate.5.weightF16[6144 16384]
-
blk.41.ffn_down.5.weightF16[16384 6144]
-
blk.41.ffn_up.5.weightF16[6144 16384]
-
blk.41.ffn_gate.6.weightF16[6144 16384]
-
blk.41.ffn_down.6.weightF16[16384 6144]
-
blk.41.ffn_up.6.weightF16[6144 16384]
-
blk.41.ffn_gate.7.weightF16[6144 16384]
-
blk.41.ffn_down.7.weightF16[16384 6144]
-
blk.41.ffn_up.7.weightF16[6144 16384]
-
blk.41.attn_norm.weightF32[6144]
-
blk.41.ffn_norm.weightF32[6144]
-
blk.42.ffn_gate.0.weightF16[6144 16384]
-
blk.42.ffn_down.0.weightF16[16384 6144]
-
blk.42.ffn_up.0.weightF16[6144 16384]
-
blk.42.ffn_gate.1.weightF16[6144 16384]
-
blk.42.ffn_down.1.weightF16[16384 6144]
-
blk.42.ffn_up.1.weightF16[6144 16384]
-
blk.42.ffn_gate.2.weightF16[6144 16384]
-
blk.42.ffn_gate_inp.weightF16[6144 8]
-
blk.42.attn_k.weightF16[6144 1024]
-
blk.42.attn_output.weightF16[6144 6144]
-
blk.42.attn_q.weightF16[6144 6144]
-
blk.42.attn_v.weightF16[6144 1024]
-
blk.42.ffn_down.2.weightF16[16384 6144]
-
blk.42.ffn_up.2.weightF16[6144 16384]
-
blk.42.ffn_gate.3.weightF16[6144 16384]
-
blk.42.ffn_down.3.weightF16[16384 6144]
-
blk.42.ffn_up.3.weightF16[6144 16384]
-
blk.42.ffn_gate.4.weightF16[6144 16384]
-
blk.42.ffn_down.4.weightF16[16384 6144]
-
blk.42.ffn_up.4.weightF16[6144 16384]
-
blk.42.ffn_gate.5.weightF16[6144 16384]
-
blk.42.ffn_down.5.weightF16[16384 6144]
-
blk.42.ffn_up.5.weightF16[6144 16384]
-
blk.42.ffn_gate.6.weightF16[6144 16384]
-
blk.42.ffn_down.6.weightF16[16384 6144]
-
blk.42.ffn_up.6.weightF16[6144 16384]
-
blk.42.ffn_gate.7.weightF16[6144 16384]
-
blk.42.ffn_down.7.weightF16[16384 6144]
-
blk.42.ffn_up.7.weightF16[6144 16384]
-
blk.42.attn_norm.weightF32[6144]
-
blk.42.ffn_norm.weightF32[6144]
-
blk.43.ffn_gate.0.weightF16[6144 16384]
-
blk.43.ffn_down.0.weightF16[16384 6144]
-
blk.43.ffn_up.0.weightF16[6144 16384]
-
blk.43.ffn_gate.1.weightF16[6144 16384]
-
blk.43.ffn_down.1.weightF16[16384 6144]
-
blk.43.ffn_up.1.weightF16[6144 16384]
-
blk.43.ffn_gate_inp.weightF16[6144 8]
-
blk.43.attn_k.weightF16[6144 1024]
-
blk.43.attn_output.weightF16[6144 6144]
-
blk.43.attn_q.weightF16[6144 6144]
-
blk.43.attn_v.weightF16[6144 1024]
-
blk.43.ffn_gate.2.weightF16[6144 16384]
-
blk.43.ffn_down.2.weightF16[16384 6144]
-
blk.43.ffn_up.2.weightF16[6144 16384]
-
blk.43.ffn_gate.3.weightF16[6144 16384]
-
blk.43.ffn_down.3.weightF16[16384 6144]
-
blk.43.ffn_up.3.weightF16[6144 16384]
-
blk.43.ffn_gate.4.weightF16[6144 16384]
-
blk.43.ffn_down.4.weightF16[16384 6144]
-
blk.43.ffn_up.4.weightF16[6144 16384]
-
blk.43.ffn_gate.5.weightF16[6144 16384]
-
blk.43.ffn_down.5.weightF16[16384 6144]
-
blk.43.ffn_up.5.weightF16[6144 16384]
-
blk.43.ffn_gate.6.weightF16[6144 16384]
-
blk.43.ffn_down.6.weightF16[16384 6144]
-
blk.43.ffn_up.6.weightF16[6144 16384]
-
blk.43.ffn_gate.7.weightF16[6144 16384]
-
blk.43.ffn_down.7.weightF16[16384 6144]
-
blk.43.ffn_up.7.weightF16[6144 16384]
-
blk.43.attn_norm.weightF32[6144]
-
blk.43.ffn_norm.weightF32[6144]
-
blk.44.ffn_gate.0.weightF16[6144 16384]
-
blk.44.ffn_down.0.weightF16[16384 6144]
-
blk.44.ffn_up.0.weightF16[6144 16384]
-
blk.44.ffn_gate.1.weightF16[6144 16384]
-
blk.44.ffn_down.1.weightF16[16384 6144]
-
blk.44.ffn_gate_inp.weightF16[6144 8]
-
blk.44.attn_k.weightF16[6144 1024]
-
blk.44.attn_output.weightF16[6144 6144]
-
blk.44.attn_q.weightF16[6144 6144]
-
blk.44.attn_v.weightF16[6144 1024]
-
blk.44.ffn_up.1.weightF16[6144 16384]
-
blk.44.ffn_gate.2.weightF16[6144 16384]
-
blk.44.ffn_down.2.weightF16[16384 6144]
-
blk.44.ffn_up.2.weightF16[6144 16384]
-
blk.44.ffn_gate.3.weightF16[6144 16384]
-
blk.44.ffn_down.3.weightF16[16384 6144]
-
blk.44.ffn_up.3.weightF16[6144 16384]
-
blk.44.ffn_gate.4.weightF16[6144 16384]
-
blk.44.ffn_down.4.weightF16[16384 6144]
-
blk.44.ffn_up.4.weightF16[6144 16384]
-
blk.44.ffn_gate.5.weightF16[6144 16384]
-
blk.44.ffn_down.5.weightF16[16384 6144]
-
blk.44.ffn_up.5.weightF16[6144 16384]
-
blk.44.ffn_gate.6.weightF16[6144 16384]
-
blk.44.ffn_down.6.weightF16[16384 6144]
-
blk.44.ffn_up.6.weightF16[6144 16384]
-
blk.44.ffn_gate.7.weightF16[6144 16384]
-
blk.44.ffn_down.7.weightF16[16384 6144]
-
blk.44.ffn_up.7.weightF16[6144 16384]
-
blk.44.attn_norm.weightF32[6144]
-
blk.44.ffn_norm.weightF32[6144]
-
blk.45.ffn_gate.0.weightF16[6144 16384]
-
blk.45.ffn_down.0.weightF16[16384 6144]
-
blk.45.ffn_up.0.weightF16[6144 16384]
-
blk.45.ffn_gate.1.weightF16[6144 16384]
-
blk.45.ffn_gate_inp.weightF16[6144 8]
-
blk.45.attn_k.weightF16[6144 1024]
-
blk.45.attn_output.weightF16[6144 6144]
-
blk.45.attn_q.weightF16[6144 6144]
-
blk.45.attn_v.weightF16[6144 1024]
-
blk.45.ffn_down.1.weightF16[16384 6144]
-
blk.45.ffn_up.1.weightF16[6144 16384]
-
blk.45.ffn_gate.2.weightF16[6144 16384]
-
blk.45.ffn_down.2.weightF16[16384 6144]
-
blk.45.ffn_up.2.weightF16[6144 16384]
-
blk.45.ffn_gate.3.weightF16[6144 16384]
-
blk.45.ffn_down.3.weightF16[16384 6144]
-
blk.45.ffn_up.3.weightF16[6144 16384]
-
blk.45.ffn_gate.4.weightF16[6144 16384]
-
blk.45.ffn_down.4.weightF16[16384 6144]
-
blk.45.ffn_up.4.weightF16[6144 16384]
-
blk.45.ffn_gate.5.weightF16[6144 16384]
-
blk.45.ffn_down.5.weightF16[16384 6144]
-
blk.45.ffn_up.5.weightF16[6144 16384]
-
blk.45.ffn_gate.6.weightF16[6144 16384]
-
blk.45.ffn_down.6.weightF16[16384 6144]
-
blk.45.ffn_up.6.weightF16[6144 16384]
-
blk.45.ffn_gate.7.weightF16[6144 16384]
-
blk.45.ffn_down.7.weightF16[16384 6144]
-
blk.45.ffn_up.7.weightF16[6144 16384]
-
blk.45.attn_norm.weightF32[6144]
-
blk.45.ffn_norm.weightF32[6144]
-
blk.46.ffn_gate.0.weightF16[6144 16384]
-
blk.46.ffn_down.0.weightF16[16384 6144]
-
blk.46.ffn_up.0.weightF16[6144 16384]
-
blk.46.ffn_gate_inp.weightF16[6144 8]
-
blk.46.attn_k.weightF16[6144 1024]
-
blk.46.attn_output.weightF16[6144 6144]
-
blk.46.attn_q.weightF16[6144 6144]
-
blk.46.attn_v.weightF16[6144 1024]
-
blk.46.ffn_gate.1.weightF16[6144 16384]
-
blk.46.ffn_down.1.weightF16[16384 6144]
-
blk.46.ffn_up.1.weightF16[6144 16384]
-
blk.46.ffn_gate.2.weightF16[6144 16384]
-
blk.46.ffn_down.2.weightF16[16384 6144]
-
blk.46.ffn_up.2.weightF16[6144 16384]
-
blk.46.ffn_gate.3.weightF16[6144 16384]
-
blk.46.ffn_down.3.weightF16[16384 6144]
-
blk.46.ffn_up.3.weightF16[6144 16384]
-
blk.46.ffn_gate.4.weightF16[6144 16384]
-
blk.46.ffn_down.4.weightF16[16384 6144]
-
blk.46.ffn_up.4.weightF16[6144 16384]
-
blk.46.ffn_gate.5.weightF16[6144 16384]
-
blk.46.ffn_down.5.weightF16[16384 6144]
-
blk.46.ffn_up.5.weightF16[6144 16384]
-
blk.46.ffn_gate.6.weightF16[6144 16384]
-
blk.46.ffn_down.6.weightF16[16384 6144]
-
blk.46.ffn_up.6.weightF16[6144 16384]
-
blk.46.ffn_gate.7.weightF16[6144 16384]
-
blk.46.ffn_down.7.weightF16[16384 6144]
-
blk.46.ffn_up.7.weightF16[6144 16384]
-
blk.46.attn_norm.weightF32[6144]
-
blk.46.ffn_norm.weightF32[6144]
-
blk.47.ffn_gate.0.weightF16[6144 16384]
-
blk.47.ffn_down.0.weightF16[16384 6144]
-
blk.47.ffn_gate_inp.weightF16[6144 8]
-
blk.47.attn_k.weightF16[6144 1024]
-
blk.47.attn_output.weightF16[6144 6144]
-
blk.47.attn_q.weightF16[6144 6144]
-
blk.47.attn_v.weightF16[6144 1024]
-
blk.47.ffn_up.0.weightF16[6144 16384]
-
blk.47.ffn_gate.1.weightF16[6144 16384]
-
blk.47.ffn_down.1.weightF16[16384 6144]
-
blk.47.ffn_up.1.weightF16[6144 16384]
-
blk.47.ffn_gate.2.weightF16[6144 16384]
-
blk.47.ffn_down.2.weightF16[16384 6144]
-
blk.47.ffn_up.2.weightF16[6144 16384]
-
blk.47.ffn_gate.3.weightF16[6144 16384]
-
blk.47.ffn_down.3.weightF16[16384 6144]
-
blk.47.ffn_up.3.weightF16[6144 16384]
-
blk.47.ffn_gate.4.weightF16[6144 16384]
-
blk.47.ffn_down.4.weightF16[16384 6144]
-
blk.47.ffn_up.4.weightF16[6144 16384]
-
blk.47.ffn_gate.5.weightF16[6144 16384]
-
blk.47.ffn_down.5.weightF16[16384 6144]
-
blk.47.ffn_up.5.weightF16[6144 16384]
-
blk.47.ffn_gate.6.weightF16[6144 16384]
-
blk.47.ffn_down.6.weightF16[16384 6144]
-
blk.47.ffn_up.6.weightF16[6144 16384]
-
blk.47.ffn_gate.7.weightF16[6144 16384]
-
blk.47.ffn_down.7.weightF16[16384 6144]
-
blk.47.ffn_up.7.weightF16[6144 16384]
-
blk.47.attn_norm.weightF32[6144]
-
blk.47.ffn_norm.weightF32[6144]
-
blk.48.ffn_gate.0.weightF16[6144 16384]
-
blk.48.ffn_gate_inp.weightF16[6144 8]
-
blk.48.attn_k.weightF16[6144 1024]
-
blk.48.attn_output.weightF16[6144 6144]
-
blk.48.attn_q.weightF16[6144 6144]
-
blk.48.attn_v.weightF16[6144 1024]
-
blk.48.ffn_down.0.weightF16[16384 6144]
-
blk.48.ffn_up.0.weightF16[6144 16384]
-
blk.48.ffn_gate.1.weightF16[6144 16384]
-
blk.48.ffn_down.1.weightF16[16384 6144]
-
blk.48.ffn_up.1.weightF16[6144 16384]
-
blk.48.ffn_gate.2.weightF16[6144 16384]
-
blk.48.ffn_down.2.weightF16[16384 6144]
-
blk.48.ffn_up.2.weightF16[6144 16384]
-
blk.48.ffn_gate.3.weightF16[6144 16384]
-
blk.48.ffn_down.3.weightF16[16384 6144]
-
blk.48.ffn_up.3.weightF16[6144 16384]
-
blk.48.ffn_gate.4.weightF16[6144 16384]
-
blk.48.ffn_down.4.weightF16[16384 6144]
-
blk.48.ffn_up.4.weightF16[6144 16384]
-
blk.48.ffn_gate.5.weightF16[6144 16384]
-
blk.48.ffn_down.5.weightF16[16384 6144]
-
blk.48.ffn_up.5.weightF16[6144 16384]
-
blk.48.ffn_gate.6.weightF16[6144 16384]
-
blk.48.ffn_down.6.weightF16[16384 6144]
-
blk.48.ffn_up.6.weightF16[6144 16384]
-
blk.48.ffn_gate.7.weightF16[6144 16384]
-
blk.48.ffn_down.7.weightF16[16384 6144]
-
blk.48.ffn_up.7.weightF16[6144 16384]
-
blk.48.attn_norm.weightF32[6144]
-
blk.48.ffn_norm.weightF32[6144]
-
blk.49.ffn_gate_inp.weightF16[6144 8]
-
blk.49.attn_k.weightF16[6144 1024]
-
blk.49.attn_output.weightF16[6144 6144]
-
blk.49.attn_q.weightF16[6144 6144]
-
blk.49.attn_v.weightF16[6144 1024]
-
blk.49.ffn_gate.0.weightF16[6144 16384]
-
blk.49.ffn_down.0.weightF16[16384 6144]
-
blk.49.ffn_up.0.weightF16[6144 16384]
-
blk.49.ffn_gate.1.weightF16[6144 16384]
-
blk.49.ffn_down.1.weightF16[16384 6144]
-
blk.49.ffn_up.1.weightF16[6144 16384]
-
blk.49.ffn_gate.2.weightF16[6144 16384]
-
blk.49.ffn_down.2.weightF16[16384 6144]
-
blk.49.ffn_up.2.weightF16[6144 16384]
-
blk.49.ffn_gate.3.weightF16[6144 16384]
-
blk.49.ffn_down.3.weightF16[16384 6144]
-
blk.49.ffn_up.3.weightF16[6144 16384]
-
blk.49.ffn_gate.4.weightF16[6144 16384]
-
blk.49.ffn_down.4.weightF16[16384 6144]
-
blk.49.ffn_up.4.weightF16[6144 16384]
-
blk.49.ffn_gate.5.weightF16[6144 16384]
-
blk.49.ffn_down.5.weightF16[16384 6144]
-
blk.49.ffn_up.5.weightF16[6144 16384]
-
blk.49.ffn_gate.6.weightF16[6144 16384]
-
blk.49.ffn_down.6.weightF16[16384 6144]
-
blk.49.ffn_up.6.weightF16[6144 16384]
-
blk.49.ffn_gate.7.weightF16[6144 16384]
-
blk.49.ffn_down.7.weightF16[16384 6144]
-
blk.49.ffn_up.7.weightF16[6144 16384]
-
blk.49.attn_norm.weightF32[6144]
-
blk.49.ffn_norm.weightF32[6144]
-
blk.50.attn_k.weightF16[6144 1024]
-
blk.50.attn_q.weightF16[6144 6144]
-
blk.50.attn_v.weightF16[6144 1024]
-
blk.50.ffn_gate.0.weightF16[6144 16384]
-
blk.50.ffn_down.0.weightF16[16384 6144]
-
blk.50.ffn_up.0.weightF16[6144 16384]
-
blk.50.ffn_gate.1.weightF16[6144 16384]
-
blk.50.ffn_down.1.weightF16[16384 6144]
-
blk.50.ffn_up.1.weightF16[6144 16384]
-
blk.50.ffn_gate.2.weightF16[6144 16384]
-
blk.50.ffn_down.2.weightF16[16384 6144]
-
blk.50.ffn_up.2.weightF16[6144 16384]
-
blk.50.ffn_gate.3.weightF16[6144 16384]
-
blk.50.ffn_down.3.weightF16[16384 6144]
-
blk.50.ffn_up.3.weightF16[6144 16384]
-
blk.50.ffn_gate.4.weightF16[6144 16384]
-
blk.50.ffn_down.4.weightF16[16384 6144]
-
blk.50.ffn_up.4.weightF16[6144 16384]
-
blk.50.ffn_gate.5.weightF16[6144 16384]
-
blk.50.ffn_down.5.weightF16[16384 6144]
-
blk.50.ffn_up.5.weightF16[6144 16384]
-
blk.50.ffn_gate.6.weightF16[6144 16384]
-
blk.50.ffn_down.6.weightF16[16384 6144]
-
blk.50.ffn_up.6.weightF16[6144 16384]
-
blk.50.ffn_gate.7.weightF16[6144 16384]
-
blk.50.ffn_down.7.weightF16[16384 6144]
-
blk.50.ffn_up.7.weightF16[6144 16384]
-
blk.50.ffn_gate_inp.weightF16[6144 8]
-
blk.50.attn_norm.weightF32[6144]
-
blk.50.ffn_norm.weightF32[6144]
-
blk.50.attn_output.weightF16[6144 6144]
-
blk.51.attn_k.weightF16[6144 1024]
-
blk.51.attn_q.weightF16[6144 6144]
-
blk.51.ffn_gate.0.weightF16[6144 16384]
-
blk.51.ffn_down.0.weightF16[16384 6144]
-
blk.51.ffn_up.0.weightF16[6144 16384]
-
blk.51.ffn_gate.1.weightF16[6144 16384]
-
blk.51.ffn_down.1.weightF16[16384 6144]
-
blk.51.ffn_up.1.weightF16[6144 16384]
-
blk.51.ffn_gate.2.weightF16[6144 16384]
-
blk.51.ffn_down.2.weightF16[16384 6144]
-
blk.51.ffn_up.2.weightF16[6144 16384]
-
blk.51.ffn_gate.3.weightF16[6144 16384]
-
blk.51.ffn_down.3.weightF16[16384 6144]
-
blk.51.ffn_up.3.weightF16[6144 16384]
-
blk.51.ffn_gate.4.weightF16[6144 16384]
-
blk.51.ffn_down.4.weightF16[16384 6144]
-
blk.51.ffn_up.4.weightF16[6144 16384]
-
blk.51.ffn_gate.5.weightF16[6144 16384]
-
blk.51.ffn_down.5.weightF16[16384 6144]
-
blk.51.ffn_up.5.weightF16[6144 16384]
-
blk.51.ffn_gate.6.weightF16[6144 16384]
-
blk.51.ffn_down.6.weightF16[16384 6144]
-
blk.51.ffn_up.6.weightF16[6144 16384]
-
blk.51.ffn_gate.7.weightF16[6144 16384]
-
blk.51.ffn_down.7.weightF16[16384 6144]
-
blk.51.ffn_up.7.weightF16[6144 16384]
-
blk.51.ffn_gate_inp.weightF16[6144 8]
-
blk.51.attn_norm.weightF32[6144]
-
blk.51.ffn_norm.weightF32[6144]
-
blk.51.attn_output.weightF16[6144 6144]
-
blk.51.attn_v.weightF16[6144 1024]
-
blk.52.attn_q.weightF16[6144 6144]
-
blk.52.ffn_gate.0.weightF16[6144 16384]
-
blk.52.ffn_down.0.weightF16[16384 6144]
-
blk.52.ffn_up.0.weightF16[6144 16384]
-
blk.52.ffn_gate.1.weightF16[6144 16384]
-
blk.52.ffn_down.1.weightF16[16384 6144]
-
blk.52.ffn_up.1.weightF16[6144 16384]
-
blk.52.ffn_gate.2.weightF16[6144 16384]
-
blk.52.ffn_down.2.weightF16[16384 6144]
-
blk.52.ffn_up.2.weightF16[6144 16384]
-
blk.52.ffn_gate.3.weightF16[6144 16384]
-
blk.52.ffn_down.3.weightF16[16384 6144]
-
blk.52.ffn_up.3.weightF16[6144 16384]
-
blk.52.ffn_gate.4.weightF16[6144 16384]
-
blk.52.ffn_down.4.weightF16[16384 6144]
-
blk.52.ffn_up.4.weightF16[6144 16384]
-
blk.52.ffn_gate.5.weightF16[6144 16384]
-
blk.52.ffn_down.5.weightF16[16384 6144]
-
blk.52.ffn_up.5.weightF16[6144 16384]
-
blk.52.ffn_gate.6.weightF16[6144 16384]
-
blk.52.ffn_down.6.weightF16[16384 6144]
-
blk.52.ffn_up.6.weightF16[6144 16384]
-
blk.52.ffn_gate.7.weightF16[6144 16384]
-
blk.52.ffn_down.7.weightF16[16384 6144]
-
blk.52.ffn_up.7.weightF16[6144 16384]
-
blk.52.ffn_gate_inp.weightF16[6144 8]
-
blk.52.attn_norm.weightF32[6144]
-
blk.52.ffn_norm.weightF32[6144]
-
blk.52.attn_k.weightF16[6144 1024]
-
blk.52.attn_output.weightF16[6144 6144]
-
blk.52.attn_v.weightF16[6144 1024]
-
blk.53.ffn_gate.0.weightF16[6144 16384]
-
blk.53.ffn_down.0.weightF16[16384 6144]
-
blk.53.ffn_up.0.weightF16[6144 16384]
-
blk.53.ffn_gate.1.weightF16[6144 16384]
-
blk.53.ffn_down.1.weightF16[16384 6144]
-
blk.53.ffn_up.1.weightF16[6144 16384]
-
blk.53.ffn_gate.2.weightF16[6144 16384]
-
blk.53.ffn_down.2.weightF16[16384 6144]
-
blk.53.ffn_up.2.weightF16[6144 16384]
-
blk.53.ffn_gate.3.weightF16[6144 16384]
-
blk.53.ffn_down.3.weightF16[16384 6144]
-
blk.53.ffn_up.3.weightF16[6144 16384]
-
blk.53.ffn_gate.4.weightF16[6144 16384]
-
blk.53.ffn_down.4.weightF16[16384 6144]
-
blk.53.ffn_up.4.weightF16[6144 16384]
-
blk.53.ffn_gate.5.weightF16[6144 16384]
-
blk.53.ffn_down.5.weightF16[16384 6144]
-
blk.53.ffn_up.5.weightF16[6144 16384]
-
blk.53.ffn_gate.6.weightF16[6144 16384]
-
blk.53.ffn_down.6.weightF16[16384 6144]
-
blk.53.ffn_up.6.weightF16[6144 16384]
-
blk.53.ffn_gate.7.weightF16[6144 16384]
-
blk.53.ffn_down.7.weightF16[16384 6144]
-
blk.53.ffn_gate_inp.weightF16[6144 8]
-
blk.53.attn_k.weightF16[6144 1024]
-
blk.53.attn_output.weightF16[6144 6144]
-
blk.53.attn_q.weightF16[6144 6144]
-
blk.53.attn_v.weightF16[6144 1024]
-
blk.53.ffn_up.7.weightF16[6144 16384]
-
blk.53.attn_norm.weightF32[6144]
-
blk.53.ffn_norm.weightF32[6144]
-
blk.54.ffn_gate.0.weightF16[6144 16384]
-
blk.54.ffn_down.0.weightF16[16384 6144]
-
blk.54.ffn_up.0.weightF16[6144 16384]
-
blk.54.ffn_gate.1.weightF16[6144 16384]
-
blk.54.ffn_down.1.weightF16[16384 6144]
-
blk.54.ffn_up.1.weightF16[6144 16384]
-
blk.54.ffn_gate.2.weightF16[6144 16384]
-
blk.54.ffn_down.2.weightF16[16384 6144]
-
blk.54.ffn_up.2.weightF16[6144 16384]
-
blk.54.ffn_gate.3.weightF16[6144 16384]
-
blk.54.ffn_down.3.weightF16[16384 6144]
-
blk.54.ffn_up.3.weightF16[6144 16384]
-
blk.54.ffn_gate.4.weightF16[6144 16384]
-
blk.54.ffn_down.4.weightF16[16384 6144]
-
blk.54.ffn_up.4.weightF16[6144 16384]
-
blk.54.ffn_gate.5.weightF16[6144 16384]
-
blk.54.ffn_down.5.weightF16[16384 6144]
-
blk.54.ffn_up.5.weightF16[6144 16384]
-
blk.54.ffn_gate.6.weightF16[6144 16384]
-
blk.54.ffn_down.6.weightF16[16384 6144]
-
blk.54.ffn_up.6.weightF16[6144 16384]
-
blk.54.ffn_gate.7.weightF16[6144 16384]
-
blk.54.ffn_gate_inp.weightF16[6144 8]
-
blk.54.attn_k.weightF16[6144 1024]
-
blk.54.attn_output.weightF16[6144 6144]
-
blk.54.attn_q.weightF16[6144 6144]
-
blk.54.attn_v.weightF16[6144 1024]
-
blk.54.ffn_down.7.weightF16[16384 6144]
-
blk.54.ffn_up.7.weightF16[6144 16384]
-
blk.54.attn_norm.weightF32[6144]
-
blk.54.ffn_norm.weightF32[6144]
-
blk.55.ffn_gate.0.weightF16[6144 16384]
-
blk.55.ffn_down.0.weightF16[16384 6144]
-
blk.55.ffn_up.0.weightF16[6144 16384]
-
blk.55.ffn_gate.1.weightF16[6144 16384]
-
blk.55.ffn_down.1.weightF16[16384 6144]
-
blk.55.ffn_up.1.weightF16[6144 16384]
-
blk.55.ffn_gate.2.weightF16[6144 16384]
-
blk.55.ffn_down.2.weightF16[16384 6144]
-
blk.55.ffn_up.2.weightF16[6144 16384]
-
blk.55.ffn_gate.3.weightF16[6144 16384]
-
blk.55.ffn_down.3.weightF16[16384 6144]
-
blk.55.ffn_up.3.weightF16[6144 16384]
-
blk.55.ffn_gate.4.weightF16[6144 16384]
-
blk.55.ffn_down.4.weightF16[16384 6144]
-
blk.55.ffn_up.4.weightF16[6144 16384]
-
blk.55.ffn_gate.5.weightF16[6144 16384]
-
blk.55.ffn_down.5.weightF16[16384 6144]
-
blk.55.ffn_up.5.weightF16[6144 16384]
-
blk.55.ffn_gate.6.weightF16[6144 16384]
-
blk.55.ffn_down.6.weightF16[16384 6144]
-
blk.55.ffn_up.6.weightF16[6144 16384]
-
blk.55.ffn_gate_inp.weightF16[6144 8]
-
blk.55.attn_k.weightF16[6144 1024]
-
blk.55.attn_output.weightF16[6144 6144]
-
blk.55.attn_q.weightF16[6144 6144]
-
blk.55.attn_v.weightF16[6144 1024]
-
blk.55.ffn_gate.7.weightF16[6144 16384]
-
blk.55.ffn_down.7.weightF16[16384 6144]
-
blk.55.ffn_up.7.weightF16[6144 16384]
-
blk.55.attn_norm.weightF32[6144]
-
blk.55.ffn_norm.weightF32[6144]
-
output.weightF16[6144 32000]
-
output_norm.weightF32[6144]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39
blk.40
blk.41
blk.42
blk.43
blk.44
blk.45
blk.46
blk.47
blk.48
blk.49
blk.50
blk.51
blk.52
blk.53
blk.54
blk.55