axolotl-ai-co/romulus-mistral-nemo-12b-simpo finetuned on jondurbin/gutenberg-dpo-v0.1
Tools
12B
16 Pulls Updated 2 weeks ago
e76e69e95465 · 10GB
-
mradermacher.convert_typehf
-
mradermacher.quantize_version2
-
mradermacher.quantized_at2024-08-14T02:24:56+02:00
-
mradermacher.quantized_bymradermacher
-
mradermacher.quantized_ondb1
-
general.architecturellama
-
general.file_typeQ6_K
-
llama.attention.head_count32
-
llama.attention.head_count_kv8
-
llama.attention.key_length128
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.attention.value_length128
-
llama.block_count40
-
llama.context_length1024000
-
llama.embedding_length5120
-
llama.feed_forward_length14336
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
llama.vocab_size131072
-
tokenizer.ggml.add_bos_tokenfalse
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.add_space_prefixfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id4
-
tokenizer.ggml.merges[Ġ Ġ Ġ t e r i n Ġ ĠĠĠ ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id10
-
tokenizer.ggml.pretekken
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <|im_start|> <|im_end|> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ6_K[5120 131072]
-
blk.0.attn_norm.weightF32[5120]
-
blk.0.ffn_down.weightQ6_K[14336 5120]
-
blk.0.ffn_gate.weightQ6_K[5120 14336]
-
blk.0.ffn_up.weightQ6_K[5120 14336]
-
blk.0.ffn_norm.weightF32[5120]
-
blk.0.attn_k.weightQ6_K[5120 1024]
-
blk.0.attn_output.weightQ6_K[4096 5120]
-
blk.0.attn_q.weightQ6_K[5120 4096]
-
blk.0.attn_v.weightQ6_K[5120 1024]
-
blk.1.attn_norm.weightF32[5120]
-
blk.1.ffn_down.weightQ6_K[14336 5120]
-
blk.1.ffn_gate.weightQ6_K[5120 14336]
-
blk.1.ffn_up.weightQ6_K[5120 14336]
-
blk.1.ffn_norm.weightF32[5120]
-
blk.1.attn_k.weightQ6_K[5120 1024]
-
blk.1.attn_output.weightQ6_K[4096 5120]
-
blk.1.attn_q.weightQ6_K[5120 4096]
-
blk.1.attn_v.weightQ6_K[5120 1024]
-
blk.2.attn_norm.weightF32[5120]
-
blk.2.ffn_down.weightQ6_K[14336 5120]
-
blk.2.ffn_gate.weightQ6_K[5120 14336]
-
blk.2.ffn_up.weightQ6_K[5120 14336]
-
blk.2.ffn_norm.weightF32[5120]
-
blk.2.attn_k.weightQ6_K[5120 1024]
-
blk.2.attn_output.weightQ6_K[4096 5120]
-
blk.2.attn_q.weightQ6_K[5120 4096]
-
blk.2.attn_v.weightQ6_K[5120 1024]
-
blk.3.attn_norm.weightF32[5120]
-
blk.3.ffn_down.weightQ6_K[14336 5120]
-
blk.3.ffn_gate.weightQ6_K[5120 14336]
-
blk.3.ffn_up.weightQ6_K[5120 14336]
-
blk.3.ffn_norm.weightF32[5120]
-
blk.3.attn_k.weightQ6_K[5120 1024]
-
blk.3.attn_output.weightQ6_K[4096 5120]
-
blk.3.attn_q.weightQ6_K[5120 4096]
-
blk.3.attn_v.weightQ6_K[5120 1024]
-
blk.4.attn_norm.weightF32[5120]
-
blk.4.ffn_down.weightQ6_K[14336 5120]
-
blk.4.ffn_gate.weightQ6_K[5120 14336]
-
blk.4.ffn_up.weightQ6_K[5120 14336]
-
blk.4.ffn_norm.weightF32[5120]
-
blk.4.attn_k.weightQ6_K[5120 1024]
-
blk.4.attn_output.weightQ6_K[4096 5120]
-
blk.4.attn_q.weightQ6_K[5120 4096]
-
blk.4.attn_v.weightQ6_K[5120 1024]
-
blk.5.attn_norm.weightF32[5120]
-
blk.5.ffn_down.weightQ6_K[14336 5120]
-
blk.5.ffn_gate.weightQ6_K[5120 14336]
-
blk.5.ffn_up.weightQ6_K[5120 14336]
-
blk.5.ffn_norm.weightF32[5120]
-
blk.5.attn_k.weightQ6_K[5120 1024]
-
blk.5.attn_output.weightQ6_K[4096 5120]
-
blk.5.attn_q.weightQ6_K[5120 4096]
-
blk.5.attn_v.weightQ6_K[5120 1024]
-
blk.6.ffn_gate.weightQ6_K[5120 14336]
-
blk.6.attn_k.weightQ6_K[5120 1024]
-
blk.6.attn_output.weightQ6_K[4096 5120]
-
blk.6.attn_q.weightQ6_K[5120 4096]
-
blk.6.attn_v.weightQ6_K[5120 1024]
-
blk.6.attn_norm.weightF32[5120]
-
blk.6.ffn_down.weightQ6_K[14336 5120]
-
blk.6.ffn_up.weightQ6_K[5120 14336]
-
blk.6.ffn_norm.weightF32[5120]
-
blk.7.attn_norm.weightF32[5120]
-
blk.7.ffn_down.weightQ6_K[14336 5120]
-
blk.7.ffn_gate.weightQ6_K[5120 14336]
-
blk.7.ffn_up.weightQ6_K[5120 14336]
-
blk.7.ffn_norm.weightF32[5120]
-
blk.7.attn_k.weightQ6_K[5120 1024]
-
blk.7.attn_output.weightQ6_K[4096 5120]
-
blk.7.attn_q.weightQ6_K[5120 4096]
-
blk.7.attn_v.weightQ6_K[5120 1024]
-
blk.8.attn_norm.weightF32[5120]
-
blk.8.ffn_down.weightQ6_K[14336 5120]
-
blk.8.ffn_gate.weightQ6_K[5120 14336]
-
blk.8.ffn_up.weightQ6_K[5120 14336]
-
blk.8.ffn_norm.weightF32[5120]
-
blk.8.attn_k.weightQ6_K[5120 1024]
-
blk.8.attn_output.weightQ6_K[4096 5120]
-
blk.8.attn_q.weightQ6_K[5120 4096]
-
blk.8.attn_v.weightQ6_K[5120 1024]
-
blk.9.attn_norm.weightF32[5120]
-
blk.9.ffn_down.weightQ6_K[14336 5120]
-
blk.9.ffn_gate.weightQ6_K[5120 14336]
-
blk.9.ffn_up.weightQ6_K[5120 14336]
-
blk.9.ffn_norm.weightF32[5120]
-
blk.9.attn_k.weightQ6_K[5120 1024]
-
blk.9.attn_output.weightQ6_K[4096 5120]
-
blk.9.attn_q.weightQ6_K[5120 4096]
-
blk.9.attn_v.weightQ6_K[5120 1024]
-
blk.10.attn_norm.weightF32[5120]
-
blk.10.ffn_down.weightQ6_K[14336 5120]
-
blk.10.ffn_gate.weightQ6_K[5120 14336]
-
blk.10.ffn_up.weightQ6_K[5120 14336]
-
blk.10.ffn_norm.weightF32[5120]
-
blk.10.attn_k.weightQ6_K[5120 1024]
-
blk.10.attn_output.weightQ6_K[4096 5120]
-
blk.10.attn_q.weightQ6_K[5120 4096]
-
blk.10.attn_v.weightQ6_K[5120 1024]
-
blk.11.attn_norm.weightF32[5120]
-
blk.11.ffn_down.weightQ6_K[14336 5120]
-
blk.11.ffn_gate.weightQ6_K[5120 14336]
-
blk.11.ffn_up.weightQ6_K[5120 14336]
-
blk.11.ffn_norm.weightF32[5120]
-
blk.11.attn_k.weightQ6_K[5120 1024]
-
blk.11.attn_output.weightQ6_K[4096 5120]
-
blk.11.attn_q.weightQ6_K[5120 4096]
-
blk.11.attn_v.weightQ6_K[5120 1024]
-
blk.12.attn_norm.weightF32[5120]
-
blk.12.ffn_down.weightQ6_K[14336 5120]
-
blk.12.ffn_gate.weightQ6_K[5120 14336]
-
blk.12.ffn_up.weightQ6_K[5120 14336]
-
blk.12.ffn_norm.weightF32[5120]
-
blk.12.attn_k.weightQ6_K[5120 1024]
-
blk.12.attn_output.weightQ6_K[4096 5120]
-
blk.12.attn_q.weightQ6_K[5120 4096]
-
blk.12.attn_v.weightQ6_K[5120 1024]
-
blk.13.attn_norm.weightF32[5120]
-
blk.13.ffn_down.weightQ6_K[14336 5120]
-
blk.13.ffn_gate.weightQ6_K[5120 14336]
-
blk.13.ffn_up.weightQ6_K[5120 14336]
-
blk.13.ffn_norm.weightF32[5120]
-
blk.13.attn_k.weightQ6_K[5120 1024]
-
blk.13.attn_output.weightQ6_K[4096 5120]
-
blk.13.attn_q.weightQ6_K[5120 4096]
-
blk.13.attn_v.weightQ6_K[5120 1024]
-
blk.14.attn_norm.weightF32[5120]
-
blk.14.ffn_down.weightQ6_K[14336 5120]
-
blk.14.ffn_gate.weightQ6_K[5120 14336]
-
blk.14.ffn_up.weightQ6_K[5120 14336]
-
blk.14.ffn_norm.weightF32[5120]
-
blk.14.attn_k.weightQ6_K[5120 1024]
-
blk.14.attn_output.weightQ6_K[4096 5120]
-
blk.14.attn_q.weightQ6_K[5120 4096]
-
blk.14.attn_v.weightQ6_K[5120 1024]
-
blk.15.ffn_gate.weightQ6_K[5120 14336]
-
blk.15.attn_k.weightQ6_K[5120 1024]
-
blk.15.attn_output.weightQ6_K[4096 5120]
-
blk.15.attn_q.weightQ6_K[5120 4096]
-
blk.15.attn_v.weightQ6_K[5120 1024]
-
blk.15.attn_norm.weightF32[5120]
-
blk.15.ffn_down.weightQ6_K[14336 5120]
-
blk.15.ffn_up.weightQ6_K[5120 14336]
-
blk.15.ffn_norm.weightF32[5120]
-
blk.16.attn_norm.weightF32[5120]
-
blk.16.ffn_down.weightQ6_K[14336 5120]
-
blk.16.ffn_gate.weightQ6_K[5120 14336]
-
blk.16.ffn_up.weightQ6_K[5120 14336]
-
blk.16.ffn_norm.weightF32[5120]
-
blk.16.attn_k.weightQ6_K[5120 1024]
-
blk.16.attn_output.weightQ6_K[4096 5120]
-
blk.16.attn_q.weightQ6_K[5120 4096]
-
blk.16.attn_v.weightQ6_K[5120 1024]
-
blk.17.attn_norm.weightF32[5120]
-
blk.17.ffn_down.weightQ6_K[14336 5120]
-
blk.17.ffn_gate.weightQ6_K[5120 14336]
-
blk.17.ffn_up.weightQ6_K[5120 14336]
-
blk.17.ffn_norm.weightF32[5120]
-
blk.17.attn_k.weightQ6_K[5120 1024]
-
blk.17.attn_output.weightQ6_K[4096 5120]
-
blk.17.attn_q.weightQ6_K[5120 4096]
-
blk.17.attn_v.weightQ6_K[5120 1024]
-
blk.18.attn_norm.weightF32[5120]
-
blk.18.ffn_down.weightQ6_K[14336 5120]
-
blk.18.ffn_gate.weightQ6_K[5120 14336]
-
blk.18.ffn_up.weightQ6_K[5120 14336]
-
blk.18.ffn_norm.weightF32[5120]
-
blk.18.attn_k.weightQ6_K[5120 1024]
-
blk.18.attn_output.weightQ6_K[4096 5120]
-
blk.18.attn_q.weightQ6_K[5120 4096]
-
blk.18.attn_v.weightQ6_K[5120 1024]
-
blk.19.attn_norm.weightF32[5120]
-
blk.19.ffn_down.weightQ6_K[14336 5120]
-
blk.19.ffn_gate.weightQ6_K[5120 14336]
-
blk.19.ffn_up.weightQ6_K[5120 14336]
-
blk.19.ffn_norm.weightF32[5120]
-
blk.19.attn_k.weightQ6_K[5120 1024]
-
blk.19.attn_output.weightQ6_K[4096 5120]
-
blk.19.attn_q.weightQ6_K[5120 4096]
-
blk.19.attn_v.weightQ6_K[5120 1024]
-
blk.20.attn_norm.weightF32[5120]
-
blk.20.ffn_down.weightQ6_K[14336 5120]
-
blk.20.ffn_gate.weightQ6_K[5120 14336]
-
blk.20.ffn_up.weightQ6_K[5120 14336]
-
blk.20.ffn_norm.weightF32[5120]
-
blk.20.attn_k.weightQ6_K[5120 1024]
-
blk.20.attn_output.weightQ6_K[4096 5120]
-
blk.20.attn_q.weightQ6_K[5120 4096]
-
blk.20.attn_v.weightQ6_K[5120 1024]
-
blk.21.attn_norm.weightF32[5120]
-
blk.21.ffn_down.weightQ6_K[14336 5120]
-
blk.21.ffn_gate.weightQ6_K[5120 14336]
-
blk.21.ffn_up.weightQ6_K[5120 14336]
-
blk.21.ffn_norm.weightF32[5120]
-
blk.21.attn_k.weightQ6_K[5120 1024]
-
blk.21.attn_output.weightQ6_K[4096 5120]
-
blk.21.attn_q.weightQ6_K[5120 4096]
-
blk.21.attn_v.weightQ6_K[5120 1024]
-
blk.22.attn_norm.weightF32[5120]
-
blk.22.ffn_down.weightQ6_K[14336 5120]
-
blk.22.ffn_gate.weightQ6_K[5120 14336]
-
blk.22.ffn_up.weightQ6_K[5120 14336]
-
blk.22.ffn_norm.weightF32[5120]
-
blk.22.attn_k.weightQ6_K[5120 1024]
-
blk.22.attn_output.weightQ6_K[4096 5120]
-
blk.22.attn_q.weightQ6_K[5120 4096]
-
blk.22.attn_v.weightQ6_K[5120 1024]
-
blk.23.attn_norm.weightF32[5120]
-
blk.23.ffn_down.weightQ6_K[14336 5120]
-
blk.23.ffn_gate.weightQ6_K[5120 14336]
-
blk.23.ffn_up.weightQ6_K[5120 14336]
-
blk.23.ffn_norm.weightF32[5120]
-
blk.23.attn_k.weightQ6_K[5120 1024]
-
blk.23.attn_output.weightQ6_K[4096 5120]
-
blk.23.attn_q.weightQ6_K[5120 4096]
-
blk.23.attn_v.weightQ6_K[5120 1024]
-
blk.24.ffn_gate.weightQ6_K[5120 14336]
-
blk.24.attn_k.weightQ6_K[5120 1024]
-
blk.24.attn_output.weightQ6_K[4096 5120]
-
blk.24.attn_q.weightQ6_K[5120 4096]
-
blk.24.attn_v.weightQ6_K[5120 1024]
-
blk.24.attn_norm.weightF32[5120]
-
blk.24.ffn_down.weightQ6_K[14336 5120]
-
blk.24.ffn_up.weightQ6_K[5120 14336]
-
blk.24.ffn_norm.weightF32[5120]
-
blk.25.attn_norm.weightF32[5120]
-
blk.25.ffn_down.weightQ6_K[14336 5120]
-
blk.25.ffn_gate.weightQ6_K[5120 14336]
-
blk.25.ffn_up.weightQ6_K[5120 14336]
-
blk.25.ffn_norm.weightF32[5120]
-
blk.25.attn_k.weightQ6_K[5120 1024]
-
blk.25.attn_output.weightQ6_K[4096 5120]
-
blk.25.attn_q.weightQ6_K[5120 4096]
-
blk.25.attn_v.weightQ6_K[5120 1024]
-
blk.26.attn_norm.weightF32[5120]
-
blk.26.ffn_down.weightQ6_K[14336 5120]
-
blk.26.ffn_gate.weightQ6_K[5120 14336]
-
blk.26.ffn_up.weightQ6_K[5120 14336]
-
blk.26.ffn_norm.weightF32[5120]
-
blk.26.attn_k.weightQ6_K[5120 1024]
-
blk.26.attn_output.weightQ6_K[4096 5120]
-
blk.26.attn_q.weightQ6_K[5120 4096]
-
blk.26.attn_v.weightQ6_K[5120 1024]
-
blk.27.attn_norm.weightF32[5120]
-
blk.27.ffn_down.weightQ6_K[14336 5120]
-
blk.27.ffn_gate.weightQ6_K[5120 14336]
-
blk.27.ffn_up.weightQ6_K[5120 14336]
-
blk.27.ffn_norm.weightF32[5120]
-
blk.27.attn_k.weightQ6_K[5120 1024]
-
blk.27.attn_output.weightQ6_K[4096 5120]
-
blk.27.attn_q.weightQ6_K[5120 4096]
-
blk.27.attn_v.weightQ6_K[5120 1024]
-
blk.28.attn_norm.weightF32[5120]
-
blk.28.ffn_down.weightQ6_K[14336 5120]
-
blk.28.ffn_gate.weightQ6_K[5120 14336]
-
blk.28.ffn_up.weightQ6_K[5120 14336]
-
blk.28.ffn_norm.weightF32[5120]
-
blk.28.attn_k.weightQ6_K[5120 1024]
-
blk.28.attn_output.weightQ6_K[4096 5120]
-
blk.28.attn_q.weightQ6_K[5120 4096]
-
blk.28.attn_v.weightQ6_K[5120 1024]
-
blk.29.attn_norm.weightF32[5120]
-
blk.29.ffn_down.weightQ6_K[14336 5120]
-
blk.29.ffn_gate.weightQ6_K[5120 14336]
-
blk.29.ffn_up.weightQ6_K[5120 14336]
-
blk.29.ffn_norm.weightF32[5120]
-
blk.29.attn_k.weightQ6_K[5120 1024]
-
blk.29.attn_output.weightQ6_K[4096 5120]
-
blk.29.attn_q.weightQ6_K[5120 4096]
-
blk.29.attn_v.weightQ6_K[5120 1024]
-
blk.30.attn_norm.weightF32[5120]
-
blk.30.ffn_down.weightQ6_K[14336 5120]
-
blk.30.ffn_gate.weightQ6_K[5120 14336]
-
blk.30.ffn_up.weightQ6_K[5120 14336]
-
blk.30.ffn_norm.weightF32[5120]
-
blk.30.attn_k.weightQ6_K[5120 1024]
-
blk.30.attn_output.weightQ6_K[4096 5120]
-
blk.30.attn_q.weightQ6_K[5120 4096]
-
blk.30.attn_v.weightQ6_K[5120 1024]
-
blk.31.attn_norm.weightF32[5120]
-
blk.31.ffn_down.weightQ6_K[14336 5120]
-
blk.31.ffn_gate.weightQ6_K[5120 14336]
-
blk.31.ffn_up.weightQ6_K[5120 14336]
-
blk.31.ffn_norm.weightF32[5120]
-
blk.31.attn_k.weightQ6_K[5120 1024]
-
blk.31.attn_output.weightQ6_K[4096 5120]
-
blk.31.attn_q.weightQ6_K[5120 4096]
-
blk.31.attn_v.weightQ6_K[5120 1024]
-
blk.32.attn_norm.weightF32[5120]
-
blk.32.ffn_down.weightQ6_K[14336 5120]
-
blk.32.ffn_gate.weightQ6_K[5120 14336]
-
blk.32.ffn_up.weightQ6_K[5120 14336]
-
blk.32.ffn_norm.weightF32[5120]
-
blk.32.attn_k.weightQ6_K[5120 1024]
-
blk.32.attn_output.weightQ6_K[4096 5120]
-
blk.32.attn_q.weightQ6_K[5120 4096]
-
blk.32.attn_v.weightQ6_K[5120 1024]
-
blk.33.ffn_gate.weightQ6_K[5120 14336]
-
blk.33.attn_k.weightQ6_K[5120 1024]
-
blk.33.attn_output.weightQ6_K[4096 5120]
-
blk.33.attn_q.weightQ6_K[5120 4096]
-
blk.33.attn_v.weightQ6_K[5120 1024]
-
blk.33.attn_norm.weightF32[5120]
-
blk.33.ffn_down.weightQ6_K[14336 5120]
-
blk.33.ffn_up.weightQ6_K[5120 14336]
-
blk.33.ffn_norm.weightF32[5120]
-
blk.34.attn_norm.weightF32[5120]
-
blk.34.ffn_down.weightQ6_K[14336 5120]
-
blk.34.ffn_gate.weightQ6_K[5120 14336]
-
blk.34.ffn_up.weightQ6_K[5120 14336]
-
blk.34.ffn_norm.weightF32[5120]
-
blk.34.attn_k.weightQ6_K[5120 1024]
-
blk.34.attn_output.weightQ6_K[4096 5120]
-
blk.34.attn_q.weightQ6_K[5120 4096]
-
blk.34.attn_v.weightQ6_K[5120 1024]
-
blk.35.attn_norm.weightF32[5120]
-
blk.35.ffn_down.weightQ6_K[14336 5120]
-
blk.35.ffn_gate.weightQ6_K[5120 14336]
-
blk.35.ffn_up.weightQ6_K[5120 14336]
-
blk.35.ffn_norm.weightF32[5120]
-
blk.35.attn_k.weightQ6_K[5120 1024]
-
blk.35.attn_output.weightQ6_K[4096 5120]
-
blk.35.attn_q.weightQ6_K[5120 4096]
-
blk.35.attn_v.weightQ6_K[5120 1024]
-
blk.36.attn_norm.weightF32[5120]
-
blk.36.ffn_down.weightQ6_K[14336 5120]
-
blk.36.ffn_gate.weightQ6_K[5120 14336]
-
blk.36.ffn_up.weightQ6_K[5120 14336]
-
blk.36.ffn_norm.weightF32[5120]
-
blk.36.attn_k.weightQ6_K[5120 1024]
-
blk.36.attn_output.weightQ6_K[4096 5120]
-
blk.36.attn_q.weightQ6_K[5120 4096]
-
blk.36.attn_v.weightQ6_K[5120 1024]
-
blk.37.attn_norm.weightF32[5120]
-
blk.37.ffn_down.weightQ6_K[14336 5120]
-
blk.37.ffn_gate.weightQ6_K[5120 14336]
-
blk.37.ffn_up.weightQ6_K[5120 14336]
-
blk.37.ffn_norm.weightF32[5120]
-
blk.37.attn_k.weightQ6_K[5120 1024]
-
blk.37.attn_output.weightQ6_K[4096 5120]
-
blk.37.attn_q.weightQ6_K[5120 4096]
-
blk.37.attn_v.weightQ6_K[5120 1024]
-
blk.38.attn_norm.weightF32[5120]
-
blk.38.ffn_down.weightQ6_K[14336 5120]
-
blk.38.ffn_gate.weightQ6_K[5120 14336]
-
blk.38.ffn_up.weightQ6_K[5120 14336]
-
blk.38.ffn_norm.weightF32[5120]
-
blk.38.attn_k.weightQ6_K[5120 1024]
-
blk.38.attn_output.weightQ6_K[4096 5120]
-
blk.38.attn_q.weightQ6_K[5120 4096]
-
blk.38.attn_v.weightQ6_K[5120 1024]
-
blk.39.attn_norm.weightF32[5120]
-
blk.39.ffn_down.weightQ6_K[14336 5120]
-
blk.39.ffn_gate.weightQ6_K[5120 14336]
-
blk.39.ffn_up.weightQ6_K[5120 14336]
-
blk.39.ffn_norm.weightF32[5120]
-
blk.39.attn_k.weightQ6_K[5120 1024]
-
blk.39.attn_output.weightQ6_K[4096 5120]
-
blk.39.attn_q.weightQ6_K[5120 4096]
-
blk.39.attn_v.weightQ6_K[5120 1024]
-
output.weightQ6_K[5120 131072]
-
output_norm.weightF32[5120]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39