StarCoder2 - Code assistant (fine-tuned) 15b model quantized to fit 16gb VRAM
187 Pulls Updated 5 months ago
9d2ec50bbaf4 · 13GB
-
general.architecturestarcoder2
-
general.file_typeQ6_K
-
starcoder2.attention.head_count48
-
starcoder2.attention.head_count_kv4
-
starcoder2.attention.layer_norm_epsilon1e-05
-
starcoder2.block_count40
-
starcoder2.context_length16384
-
starcoder2.embedding_length6144
-
starcoder2.feed_forward_length24576
-
starcoder2.rope.freq_base100000
-
tokenizer.ggml.bos_token_id49152
-
tokenizer.ggml.eos_token_id49153
-
tokenizer.ggml.merges[Ġ Ġ ĠĠ ĠĠ ĠĠĠĠ ĠĠĠĠ ĠĠ Ġ e r ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id49153
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<|endoftext|> <fim_prefix> <fim_middle> <fim_suffix> <fim_pad> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ6_K[6144 49154]
-
blk.0.attn_norm.biasF32[6144]
-
blk.0.attn_norm.weightF32[6144]
-
blk.0.ffn_up.biasF32[24576]
-
blk.0.ffn_up.weightQ6_K[6144 24576]
-
blk.0.ffn_down.biasF32[6144]
-
blk.0.ffn_down.weightQ6_K[24576 6144]
-
blk.0.ffn_norm.biasF32[6144]
-
blk.0.ffn_norm.weightF32[6144]
-
blk.0.attn_k.biasF32[512]
-
blk.0.attn_k.weightQ6_K[6144 512]
-
blk.0.attn_output.biasF32[6144]
-
blk.0.attn_output.weightQ6_K[6144 6144]
-
blk.0.attn_q.biasF32[6144]
-
blk.0.attn_q.weightQ6_K[6144 6144]
-
blk.0.attn_v.biasF32[512]
-
blk.0.attn_v.weightQ6_K[6144 512]
-
blk.1.attn_norm.biasF32[6144]
-
blk.1.attn_norm.weightF32[6144]
-
blk.1.ffn_up.biasF32[24576]
-
blk.1.ffn_up.weightQ6_K[6144 24576]
-
blk.1.ffn_down.biasF32[6144]
-
blk.1.ffn_down.weightQ6_K[24576 6144]
-
blk.1.ffn_norm.biasF32[6144]
-
blk.1.ffn_norm.weightF32[6144]
-
blk.1.attn_k.biasF32[512]
-
blk.1.attn_k.weightQ6_K[6144 512]
-
blk.1.attn_output.biasF32[6144]
-
blk.1.attn_output.weightQ6_K[6144 6144]
-
blk.1.attn_q.biasF32[6144]
-
blk.1.attn_q.weightQ6_K[6144 6144]
-
blk.1.attn_v.biasF32[512]
-
blk.1.attn_v.weightQ6_K[6144 512]
-
blk.2.attn_norm.biasF32[6144]
-
blk.2.attn_norm.weightF32[6144]
-
blk.2.ffn_up.biasF32[24576]
-
blk.2.ffn_up.weightQ6_K[6144 24576]
-
blk.2.ffn_down.biasF32[6144]
-
blk.2.ffn_down.weightQ6_K[24576 6144]
-
blk.2.ffn_norm.biasF32[6144]
-
blk.2.ffn_norm.weightF32[6144]
-
blk.2.attn_k.biasF32[512]
-
blk.2.attn_k.weightQ6_K[6144 512]
-
blk.2.attn_output.biasF32[6144]
-
blk.2.attn_output.weightQ6_K[6144 6144]
-
blk.2.attn_q.biasF32[6144]
-
blk.2.attn_q.weightQ6_K[6144 6144]
-
blk.2.attn_v.biasF32[512]
-
blk.2.attn_v.weightQ6_K[6144 512]
-
blk.3.attn_norm.biasF32[6144]
-
blk.3.attn_norm.weightF32[6144]
-
blk.3.ffn_up.biasF32[24576]
-
blk.3.ffn_up.weightQ6_K[6144 24576]
-
blk.3.ffn_down.biasF32[6144]
-
blk.3.ffn_down.weightQ6_K[24576 6144]
-
blk.3.ffn_norm.biasF32[6144]
-
blk.3.ffn_norm.weightF32[6144]
-
blk.3.attn_k.biasF32[512]
-
blk.3.attn_k.weightQ6_K[6144 512]
-
blk.3.attn_output.biasF32[6144]
-
blk.3.attn_output.weightQ6_K[6144 6144]
-
blk.3.attn_q.biasF32[6144]
-
blk.3.attn_q.weightQ6_K[6144 6144]
-
blk.3.attn_v.biasF32[512]
-
blk.3.attn_v.weightQ6_K[6144 512]
-
blk.4.attn_norm.biasF32[6144]
-
blk.4.attn_norm.weightF32[6144]
-
blk.4.ffn_up.biasF32[24576]
-
blk.4.ffn_up.weightQ6_K[6144 24576]
-
blk.4.ffn_down.biasF32[6144]
-
blk.4.ffn_down.weightQ6_K[24576 6144]
-
blk.4.ffn_norm.biasF32[6144]
-
blk.4.ffn_norm.weightF32[6144]
-
blk.4.attn_k.biasF32[512]
-
blk.4.attn_k.weightQ6_K[6144 512]
-
blk.4.attn_output.biasF32[6144]
-
blk.4.attn_output.weightQ6_K[6144 6144]
-
blk.4.attn_q.biasF32[6144]
-
blk.4.attn_q.weightQ6_K[6144 6144]
-
blk.4.attn_v.biasF32[512]
-
blk.4.attn_v.weightQ6_K[6144 512]
-
blk.5.ffn_up.biasF32[24576]
-
blk.5.ffn_up.weightQ6_K[6144 24576]
-
blk.5.attn_k.biasF32[512]
-
blk.5.attn_k.weightQ6_K[6144 512]
-
blk.5.attn_output.biasF32[6144]
-
blk.5.attn_output.weightQ6_K[6144 6144]
-
blk.5.attn_q.biasF32[6144]
-
blk.5.attn_q.weightQ6_K[6144 6144]
-
blk.5.attn_v.biasF32[512]
-
blk.5.attn_v.weightQ6_K[6144 512]
-
blk.5.attn_norm.biasF32[6144]
-
blk.5.attn_norm.weightF32[6144]
-
blk.5.ffn_down.biasF32[6144]
-
blk.5.ffn_down.weightQ6_K[24576 6144]
-
blk.5.ffn_norm.biasF32[6144]
-
blk.5.ffn_norm.weightF32[6144]
-
blk.6.attn_norm.biasF32[6144]
-
blk.6.attn_norm.weightF32[6144]
-
blk.6.ffn_up.biasF32[24576]
-
blk.6.ffn_up.weightQ6_K[6144 24576]
-
blk.6.ffn_down.biasF32[6144]
-
blk.6.ffn_down.weightQ6_K[24576 6144]
-
blk.6.ffn_norm.biasF32[6144]
-
blk.6.ffn_norm.weightF32[6144]
-
blk.6.attn_k.biasF32[512]
-
blk.6.attn_k.weightQ6_K[6144 512]
-
blk.6.attn_output.biasF32[6144]
-
blk.6.attn_output.weightQ6_K[6144 6144]
-
blk.6.attn_q.biasF32[6144]
-
blk.6.attn_q.weightQ6_K[6144 6144]
-
blk.6.attn_v.biasF32[512]
-
blk.6.attn_v.weightQ6_K[6144 512]
-
blk.7.attn_norm.biasF32[6144]
-
blk.7.attn_norm.weightF32[6144]
-
blk.7.ffn_up.biasF32[24576]
-
blk.7.ffn_up.weightQ6_K[6144 24576]
-
blk.7.ffn_down.biasF32[6144]
-
blk.7.ffn_down.weightQ6_K[24576 6144]
-
blk.7.ffn_norm.biasF32[6144]
-
blk.7.ffn_norm.weightF32[6144]
-
blk.7.attn_k.biasF32[512]
-
blk.7.attn_k.weightQ6_K[6144 512]
-
blk.7.attn_output.biasF32[6144]
-
blk.7.attn_output.weightQ6_K[6144 6144]
-
blk.7.attn_q.biasF32[6144]
-
blk.7.attn_q.weightQ6_K[6144 6144]
-
blk.7.attn_v.biasF32[512]
-
blk.7.attn_v.weightQ6_K[6144 512]
-
blk.8.attn_norm.biasF32[6144]
-
blk.8.attn_norm.weightF32[6144]
-
blk.8.ffn_up.biasF32[24576]
-
blk.8.ffn_up.weightQ6_K[6144 24576]
-
blk.8.ffn_down.biasF32[6144]
-
blk.8.ffn_down.weightQ6_K[24576 6144]
-
blk.8.ffn_norm.biasF32[6144]
-
blk.8.ffn_norm.weightF32[6144]
-
blk.8.attn_k.biasF32[512]
-
blk.8.attn_k.weightQ6_K[6144 512]
-
blk.8.attn_output.biasF32[6144]
-
blk.8.attn_output.weightQ6_K[6144 6144]
-
blk.8.attn_q.biasF32[6144]
-
blk.8.attn_q.weightQ6_K[6144 6144]
-
blk.8.attn_v.biasF32[512]
-
blk.8.attn_v.weightQ6_K[6144 512]
-
blk.9.attn_norm.biasF32[6144]
-
blk.9.attn_norm.weightF32[6144]
-
blk.9.ffn_up.biasF32[24576]
-
blk.9.ffn_up.weightQ6_K[6144 24576]
-
blk.9.ffn_down.biasF32[6144]
-
blk.9.ffn_down.weightQ6_K[24576 6144]
-
blk.9.ffn_norm.biasF32[6144]
-
blk.9.ffn_norm.weightF32[6144]
-
blk.9.attn_k.biasF32[512]
-
blk.9.attn_k.weightQ6_K[6144 512]
-
blk.9.attn_output.biasF32[6144]
-
blk.9.attn_output.weightQ6_K[6144 6144]
-
blk.9.attn_q.biasF32[6144]
-
blk.9.attn_q.weightQ6_K[6144 6144]
-
blk.9.attn_v.biasF32[512]
-
blk.9.attn_v.weightQ6_K[6144 512]
-
blk.10.attn_norm.biasF32[6144]
-
blk.10.attn_norm.weightF32[6144]
-
blk.10.ffn_up.biasF32[24576]
-
blk.10.ffn_up.weightQ6_K[6144 24576]
-
blk.10.ffn_down.biasF32[6144]
-
blk.10.ffn_down.weightQ6_K[24576 6144]
-
blk.10.ffn_norm.biasF32[6144]
-
blk.10.ffn_norm.weightF32[6144]
-
blk.10.attn_k.biasF32[512]
-
blk.10.attn_k.weightQ6_K[6144 512]
-
blk.10.attn_output.biasF32[6144]
-
blk.10.attn_output.weightQ6_K[6144 6144]
-
blk.10.attn_q.biasF32[6144]
-
blk.10.attn_q.weightQ6_K[6144 6144]
-
blk.10.attn_v.biasF32[512]
-
blk.10.attn_v.weightQ6_K[6144 512]
-
blk.11.attn_norm.biasF32[6144]
-
blk.11.attn_norm.weightF32[6144]
-
blk.11.ffn_up.biasF32[24576]
-
blk.11.ffn_up.weightQ6_K[6144 24576]
-
blk.11.ffn_down.biasF32[6144]
-
blk.11.ffn_down.weightQ6_K[24576 6144]
-
blk.11.ffn_norm.biasF32[6144]
-
blk.11.ffn_norm.weightF32[6144]
-
blk.11.attn_k.biasF32[512]
-
blk.11.attn_k.weightQ6_K[6144 512]
-
blk.11.attn_output.biasF32[6144]
-
blk.11.attn_output.weightQ6_K[6144 6144]
-
blk.11.attn_q.biasF32[6144]
-
blk.11.attn_q.weightQ6_K[6144 6144]
-
blk.11.attn_v.biasF32[512]
-
blk.11.attn_v.weightQ6_K[6144 512]
-
blk.12.attn_k.biasF32[512]
-
blk.12.attn_k.weightQ6_K[6144 512]
-
blk.12.attn_q.biasF32[6144]
-
blk.12.attn_q.weightQ6_K[6144 6144]
-
blk.12.attn_v.biasF32[512]
-
blk.12.attn_v.weightQ6_K[6144 512]
-
blk.12.attn_norm.biasF32[6144]
-
blk.12.attn_norm.weightF32[6144]
-
blk.12.ffn_up.biasF32[24576]
-
blk.12.ffn_up.weightQ6_K[6144 24576]
-
blk.12.ffn_down.biasF32[6144]
-
blk.12.ffn_down.weightQ6_K[24576 6144]
-
blk.12.ffn_norm.biasF32[6144]
-
blk.12.ffn_norm.weightF32[6144]
-
blk.12.attn_output.biasF32[6144]
-
blk.12.attn_output.weightQ6_K[6144 6144]
-
blk.13.attn_norm.biasF32[6144]
-
blk.13.attn_norm.weightF32[6144]
-
blk.13.ffn_up.biasF32[24576]
-
blk.13.ffn_up.weightQ6_K[6144 24576]
-
blk.13.ffn_down.biasF32[6144]
-
blk.13.ffn_down.weightQ6_K[24576 6144]
-
blk.13.ffn_norm.biasF32[6144]
-
blk.13.ffn_norm.weightF32[6144]
-
blk.13.attn_k.biasF32[512]
-
blk.13.attn_k.weightQ6_K[6144 512]
-
blk.13.attn_output.biasF32[6144]
-
blk.13.attn_output.weightQ6_K[6144 6144]
-
blk.13.attn_q.biasF32[6144]
-
blk.13.attn_q.weightQ6_K[6144 6144]
-
blk.13.attn_v.biasF32[512]
-
blk.13.attn_v.weightQ6_K[6144 512]
-
blk.14.attn_norm.biasF32[6144]
-
blk.14.attn_norm.weightF32[6144]
-
blk.14.ffn_up.biasF32[24576]
-
blk.14.ffn_up.weightQ6_K[6144 24576]
-
blk.14.ffn_down.biasF32[6144]
-
blk.14.ffn_down.weightQ6_K[24576 6144]
-
blk.14.ffn_norm.biasF32[6144]
-
blk.14.ffn_norm.weightF32[6144]
-
blk.14.attn_k.biasF32[512]
-
blk.14.attn_k.weightQ6_K[6144 512]
-
blk.14.attn_output.biasF32[6144]
-
blk.14.attn_output.weightQ6_K[6144 6144]
-
blk.14.attn_q.biasF32[6144]
-
blk.14.attn_q.weightQ6_K[6144 6144]
-
blk.14.attn_v.biasF32[512]
-
blk.14.attn_v.weightQ6_K[6144 512]
-
blk.15.attn_norm.biasF32[6144]
-
blk.15.attn_norm.weightF32[6144]
-
blk.15.ffn_up.biasF32[24576]
-
blk.15.ffn_up.weightQ6_K[6144 24576]
-
blk.15.ffn_down.biasF32[6144]
-
blk.15.ffn_down.weightQ6_K[24576 6144]
-
blk.15.ffn_norm.biasF32[6144]
-
blk.15.ffn_norm.weightF32[6144]
-
blk.15.attn_k.biasF32[512]
-
blk.15.attn_k.weightQ6_K[6144 512]
-
blk.15.attn_output.biasF32[6144]
-
blk.15.attn_output.weightQ6_K[6144 6144]
-
blk.15.attn_q.biasF32[6144]
-
blk.15.attn_q.weightQ6_K[6144 6144]
-
blk.15.attn_v.biasF32[512]
-
blk.15.attn_v.weightQ6_K[6144 512]
-
blk.16.attn_norm.biasF32[6144]
-
blk.16.attn_norm.weightF32[6144]
-
blk.16.ffn_up.biasF32[24576]
-
blk.16.ffn_up.weightQ6_K[6144 24576]
-
blk.16.ffn_down.biasF32[6144]
-
blk.16.ffn_down.weightQ6_K[24576 6144]
-
blk.16.ffn_norm.biasF32[6144]
-
blk.16.ffn_norm.weightF32[6144]
-
blk.16.attn_k.biasF32[512]
-
blk.16.attn_k.weightQ6_K[6144 512]
-
blk.16.attn_output.biasF32[6144]
-
blk.16.attn_output.weightQ6_K[6144 6144]
-
blk.16.attn_q.biasF32[6144]
-
blk.16.attn_q.weightQ6_K[6144 6144]
-
blk.16.attn_v.biasF32[512]
-
blk.16.attn_v.weightQ6_K[6144 512]
-
blk.17.attn_norm.biasF32[6144]
-
blk.17.attn_norm.weightF32[6144]
-
blk.17.ffn_up.biasF32[24576]
-
blk.17.ffn_up.weightQ6_K[6144 24576]
-
blk.17.ffn_down.biasF32[6144]
-
blk.17.ffn_down.weightQ6_K[24576 6144]
-
blk.17.ffn_norm.biasF32[6144]
-
blk.17.ffn_norm.weightF32[6144]
-
blk.17.attn_k.biasF32[512]
-
blk.17.attn_k.weightQ6_K[6144 512]
-
blk.17.attn_output.biasF32[6144]
-
blk.17.attn_output.weightQ6_K[6144 6144]
-
blk.17.attn_q.biasF32[6144]
-
blk.17.attn_q.weightQ6_K[6144 6144]
-
blk.17.attn_v.biasF32[512]
-
blk.17.attn_v.weightQ6_K[6144 512]
-
blk.18.ffn_up.biasF32[24576]
-
blk.18.ffn_up.weightQ6_K[6144 24576]
-
blk.18.attn_k.biasF32[512]
-
blk.18.attn_k.weightQ6_K[6144 512]
-
blk.18.attn_output.biasF32[6144]
-
blk.18.attn_output.weightQ6_K[6144 6144]
-
blk.18.attn_q.biasF32[6144]
-
blk.18.attn_q.weightQ6_K[6144 6144]
-
blk.18.attn_v.biasF32[512]
-
blk.18.attn_v.weightQ6_K[6144 512]
-
blk.18.attn_norm.biasF32[6144]
-
blk.18.attn_norm.weightF32[6144]
-
blk.18.ffn_down.biasF32[6144]
-
blk.18.ffn_down.weightQ6_K[24576 6144]
-
blk.18.ffn_norm.biasF32[6144]
-
blk.18.ffn_norm.weightF32[6144]
-
blk.19.attn_norm.biasF32[6144]
-
blk.19.attn_norm.weightF32[6144]
-
blk.19.ffn_up.biasF32[24576]
-
blk.19.ffn_up.weightQ6_K[6144 24576]
-
blk.19.ffn_down.biasF32[6144]
-
blk.19.ffn_down.weightQ6_K[24576 6144]
-
blk.19.ffn_norm.biasF32[6144]
-
blk.19.ffn_norm.weightF32[6144]
-
blk.19.attn_k.biasF32[512]
-
blk.19.attn_k.weightQ6_K[6144 512]
-
blk.19.attn_output.biasF32[6144]
-
blk.19.attn_output.weightQ6_K[6144 6144]
-
blk.19.attn_q.biasF32[6144]
-
blk.19.attn_q.weightQ6_K[6144 6144]
-
blk.19.attn_v.biasF32[512]
-
blk.19.attn_v.weightQ6_K[6144 512]
-
blk.20.attn_norm.biasF32[6144]
-
blk.20.attn_norm.weightF32[6144]
-
blk.20.ffn_up.biasF32[24576]
-
blk.20.ffn_up.weightQ6_K[6144 24576]
-
blk.20.ffn_down.biasF32[6144]
-
blk.20.ffn_down.weightQ6_K[24576 6144]
-
blk.20.ffn_norm.biasF32[6144]
-
blk.20.ffn_norm.weightF32[6144]
-
blk.20.attn_k.biasF32[512]
-
blk.20.attn_k.weightQ6_K[6144 512]
-
blk.20.attn_output.biasF32[6144]
-
blk.20.attn_output.weightQ6_K[6144 6144]
-
blk.20.attn_q.biasF32[6144]
-
blk.20.attn_q.weightQ6_K[6144 6144]
-
blk.20.attn_v.biasF32[512]
-
blk.20.attn_v.weightQ6_K[6144 512]
-
blk.21.attn_norm.biasF32[6144]
-
blk.21.attn_norm.weightF32[6144]
-
blk.21.ffn_up.biasF32[24576]
-
blk.21.ffn_up.weightQ6_K[6144 24576]
-
blk.21.ffn_down.biasF32[6144]
-
blk.21.ffn_down.weightQ6_K[24576 6144]
-
blk.21.ffn_norm.biasF32[6144]
-
blk.21.ffn_norm.weightF32[6144]
-
blk.21.attn_k.biasF32[512]
-
blk.21.attn_k.weightQ6_K[6144 512]
-
blk.21.attn_output.biasF32[6144]
-
blk.21.attn_output.weightQ6_K[6144 6144]
-
blk.21.attn_q.biasF32[6144]
-
blk.21.attn_q.weightQ6_K[6144 6144]
-
blk.21.attn_v.biasF32[512]
-
blk.21.attn_v.weightQ6_K[6144 512]
-
blk.22.attn_norm.biasF32[6144]
-
blk.22.attn_norm.weightF32[6144]
-
blk.22.ffn_up.biasF32[24576]
-
blk.22.ffn_up.weightQ6_K[6144 24576]
-
blk.22.ffn_down.biasF32[6144]
-
blk.22.ffn_down.weightQ6_K[24576 6144]
-
blk.22.ffn_norm.biasF32[6144]
-
blk.22.ffn_norm.weightF32[6144]
-
blk.22.attn_k.biasF32[512]
-
blk.22.attn_k.weightQ6_K[6144 512]
-
blk.22.attn_output.biasF32[6144]
-
blk.22.attn_output.weightQ6_K[6144 6144]
-
blk.22.attn_q.biasF32[6144]
-
blk.22.attn_q.weightQ6_K[6144 6144]
-
blk.22.attn_v.biasF32[512]
-
blk.22.attn_v.weightQ6_K[6144 512]
-
blk.23.attn_norm.biasF32[6144]
-
blk.23.attn_norm.weightF32[6144]
-
blk.23.ffn_up.biasF32[24576]
-
blk.23.ffn_up.weightQ6_K[6144 24576]
-
blk.23.ffn_down.biasF32[6144]
-
blk.23.ffn_down.weightQ6_K[24576 6144]
-
blk.23.ffn_norm.biasF32[6144]
-
blk.23.ffn_norm.weightF32[6144]
-
blk.23.attn_k.biasF32[512]
-
blk.23.attn_k.weightQ6_K[6144 512]
-
blk.23.attn_output.biasF32[6144]
-
blk.23.attn_output.weightQ6_K[6144 6144]
-
blk.23.attn_q.biasF32[6144]
-
blk.23.attn_q.weightQ6_K[6144 6144]
-
blk.23.attn_v.biasF32[512]
-
blk.23.attn_v.weightQ6_K[6144 512]
-
blk.24.attn_norm.biasF32[6144]
-
blk.24.attn_norm.weightF32[6144]
-
blk.24.ffn_up.biasF32[24576]
-
blk.24.ffn_up.weightQ6_K[6144 24576]
-
blk.24.ffn_down.biasF32[6144]
-
blk.24.ffn_down.weightQ6_K[24576 6144]
-
blk.24.ffn_norm.biasF32[6144]
-
blk.24.ffn_norm.weightF32[6144]
-
blk.24.attn_k.biasF32[512]
-
blk.24.attn_k.weightQ6_K[6144 512]
-
blk.24.attn_output.biasF32[6144]
-
blk.24.attn_output.weightQ6_K[6144 6144]
-
blk.24.attn_q.biasF32[6144]
-
blk.24.attn_q.weightQ6_K[6144 6144]
-
blk.24.attn_v.biasF32[512]
-
blk.24.attn_v.weightQ6_K[6144 512]
-
blk.25.attn_k.biasF32[512]
-
blk.25.attn_k.weightQ6_K[6144 512]
-
blk.25.attn_q.biasF32[6144]
-
blk.25.attn_q.weightQ6_K[6144 6144]
-
blk.25.attn_v.biasF32[512]
-
blk.25.attn_v.weightQ6_K[6144 512]
-
blk.25.attn_norm.biasF32[6144]
-
blk.25.attn_norm.weightF32[6144]
-
blk.25.ffn_up.biasF32[24576]
-
blk.25.ffn_up.weightQ6_K[6144 24576]
-
blk.25.ffn_down.biasF32[6144]
-
blk.25.ffn_down.weightQ6_K[24576 6144]
-
blk.25.ffn_norm.biasF32[6144]
-
blk.25.ffn_norm.weightF32[6144]
-
blk.25.attn_output.biasF32[6144]
-
blk.25.attn_output.weightQ6_K[6144 6144]
-
blk.26.attn_norm.biasF32[6144]
-
blk.26.attn_norm.weightF32[6144]
-
blk.26.ffn_up.biasF32[24576]
-
blk.26.ffn_up.weightQ6_K[6144 24576]
-
blk.26.ffn_down.biasF32[6144]
-
blk.26.ffn_down.weightQ6_K[24576 6144]
-
blk.26.ffn_norm.biasF32[6144]
-
blk.26.ffn_norm.weightF32[6144]
-
blk.26.attn_k.biasF32[512]
-
blk.26.attn_k.weightQ6_K[6144 512]
-
blk.26.attn_output.biasF32[6144]
-
blk.26.attn_output.weightQ6_K[6144 6144]
-
blk.26.attn_q.biasF32[6144]
-
blk.26.attn_q.weightQ6_K[6144 6144]
-
blk.26.attn_v.biasF32[512]
-
blk.26.attn_v.weightQ6_K[6144 512]
-
blk.27.attn_norm.biasF32[6144]
-
blk.27.attn_norm.weightF32[6144]
-
blk.27.ffn_up.biasF32[24576]
-
blk.27.ffn_up.weightQ6_K[6144 24576]
-
blk.27.ffn_down.biasF32[6144]
-
blk.27.ffn_down.weightQ6_K[24576 6144]
-
blk.27.ffn_norm.biasF32[6144]
-
blk.27.ffn_norm.weightF32[6144]
-
blk.27.attn_k.biasF32[512]
-
blk.27.attn_k.weightQ6_K[6144 512]
-
blk.27.attn_output.biasF32[6144]
-
blk.27.attn_output.weightQ6_K[6144 6144]
-
blk.27.attn_q.biasF32[6144]
-
blk.27.attn_q.weightQ6_K[6144 6144]
-
blk.27.attn_v.biasF32[512]
-
blk.27.attn_v.weightQ6_K[6144 512]
-
blk.28.attn_norm.biasF32[6144]
-
blk.28.attn_norm.weightF32[6144]
-
blk.28.ffn_up.biasF32[24576]
-
blk.28.ffn_up.weightQ6_K[6144 24576]
-
blk.28.ffn_down.biasF32[6144]
-
blk.28.ffn_down.weightQ6_K[24576 6144]
-
blk.28.ffn_norm.biasF32[6144]
-
blk.28.ffn_norm.weightF32[6144]
-
blk.28.attn_k.biasF32[512]
-
blk.28.attn_k.weightQ6_K[6144 512]
-
blk.28.attn_output.biasF32[6144]
-
blk.28.attn_output.weightQ6_K[6144 6144]
-
blk.28.attn_q.biasF32[6144]
-
blk.28.attn_q.weightQ6_K[6144 6144]
-
blk.28.attn_v.biasF32[512]
-
blk.28.attn_v.weightQ6_K[6144 512]
-
blk.29.attn_norm.biasF32[6144]
-
blk.29.attn_norm.weightF32[6144]
-
blk.29.ffn_up.biasF32[24576]
-
blk.29.ffn_up.weightQ6_K[6144 24576]
-
blk.29.ffn_down.biasF32[6144]
-
blk.29.ffn_down.weightQ6_K[24576 6144]
-
blk.29.ffn_norm.biasF32[6144]
-
blk.29.ffn_norm.weightF32[6144]
-
blk.29.attn_k.biasF32[512]
-
blk.29.attn_k.weightQ6_K[6144 512]
-
blk.29.attn_output.biasF32[6144]
-
blk.29.attn_output.weightQ6_K[6144 6144]
-
blk.29.attn_q.biasF32[6144]
-
blk.29.attn_q.weightQ6_K[6144 6144]
-
blk.29.attn_v.biasF32[512]
-
blk.29.attn_v.weightQ6_K[6144 512]
-
blk.30.attn_norm.biasF32[6144]
-
blk.30.attn_norm.weightF32[6144]
-
blk.30.ffn_up.biasF32[24576]
-
blk.30.ffn_up.weightQ6_K[6144 24576]
-
blk.30.ffn_down.biasF32[6144]
-
blk.30.ffn_down.weightQ6_K[24576 6144]
-
blk.30.ffn_norm.biasF32[6144]
-
blk.30.ffn_norm.weightF32[6144]
-
blk.30.attn_k.biasF32[512]
-
blk.30.attn_k.weightQ6_K[6144 512]
-
blk.30.attn_output.biasF32[6144]
-
blk.30.attn_output.weightQ6_K[6144 6144]
-
blk.30.attn_q.biasF32[6144]
-
blk.30.attn_q.weightQ6_K[6144 6144]
-
blk.30.attn_v.biasF32[512]
-
blk.30.attn_v.weightQ6_K[6144 512]
-
blk.31.ffn_up.biasF32[24576]
-
blk.31.ffn_up.weightQ6_K[6144 24576]
-
blk.31.attn_k.biasF32[512]
-
blk.31.attn_k.weightQ6_K[6144 512]
-
blk.31.attn_output.biasF32[6144]
-
blk.31.attn_output.weightQ6_K[6144 6144]
-
blk.31.attn_q.biasF32[6144]
-
blk.31.attn_q.weightQ6_K[6144 6144]
-
blk.31.attn_v.biasF32[512]
-
blk.31.attn_v.weightQ6_K[6144 512]
-
blk.31.attn_norm.biasF32[6144]
-
blk.31.attn_norm.weightF32[6144]
-
blk.31.ffn_down.biasF32[6144]
-
blk.31.ffn_down.weightQ6_K[24576 6144]
-
blk.31.ffn_norm.biasF32[6144]
-
blk.31.ffn_norm.weightF32[6144]
-
blk.32.attn_norm.biasF32[6144]
-
blk.32.attn_norm.weightF32[6144]
-
blk.32.ffn_up.biasF32[24576]
-
blk.32.ffn_up.weightQ6_K[6144 24576]
-
blk.32.ffn_down.biasF32[6144]
-
blk.32.ffn_down.weightQ6_K[24576 6144]
-
blk.32.ffn_norm.biasF32[6144]
-
blk.32.ffn_norm.weightF32[6144]
-
blk.32.attn_k.biasF32[512]
-
blk.32.attn_k.weightQ6_K[6144 512]
-
blk.32.attn_output.biasF32[6144]
-
blk.32.attn_output.weightQ6_K[6144 6144]
-
blk.32.attn_q.biasF32[6144]
-
blk.32.attn_q.weightQ6_K[6144 6144]
-
blk.32.attn_v.biasF32[512]
-
blk.32.attn_v.weightQ6_K[6144 512]
-
blk.33.attn_norm.biasF32[6144]
-
blk.33.attn_norm.weightF32[6144]
-
blk.33.ffn_up.biasF32[24576]
-
blk.33.ffn_up.weightQ6_K[6144 24576]
-
blk.33.ffn_down.biasF32[6144]
-
blk.33.ffn_down.weightQ6_K[24576 6144]
-
blk.33.ffn_norm.biasF32[6144]
-
blk.33.ffn_norm.weightF32[6144]
-
blk.33.attn_k.biasF32[512]
-
blk.33.attn_k.weightQ6_K[6144 512]
-
blk.33.attn_output.biasF32[6144]
-
blk.33.attn_output.weightQ6_K[6144 6144]
-
blk.33.attn_q.biasF32[6144]
-
blk.33.attn_q.weightQ6_K[6144 6144]
-
blk.33.attn_v.biasF32[512]
-
blk.33.attn_v.weightQ6_K[6144 512]
-
blk.34.attn_norm.biasF32[6144]
-
blk.34.attn_norm.weightF32[6144]
-
blk.34.ffn_up.biasF32[24576]
-
blk.34.ffn_up.weightQ6_K[6144 24576]
-
blk.34.ffn_down.biasF32[6144]
-
blk.34.ffn_down.weightQ6_K[24576 6144]
-
blk.34.ffn_norm.biasF32[6144]
-
blk.34.ffn_norm.weightF32[6144]
-
blk.34.attn_k.biasF32[512]
-
blk.34.attn_k.weightQ6_K[6144 512]
-
blk.34.attn_output.biasF32[6144]
-
blk.34.attn_output.weightQ6_K[6144 6144]
-
blk.34.attn_q.biasF32[6144]
-
blk.34.attn_q.weightQ6_K[6144 6144]
-
blk.34.attn_v.biasF32[512]
-
blk.34.attn_v.weightQ6_K[6144 512]
-
blk.35.attn_norm.biasF32[6144]
-
blk.35.attn_norm.weightF32[6144]
-
blk.35.ffn_up.biasF32[24576]
-
blk.35.ffn_up.weightQ6_K[6144 24576]
-
blk.35.ffn_down.biasF32[6144]
-
blk.35.ffn_down.weightQ6_K[24576 6144]
-
blk.35.ffn_norm.biasF32[6144]
-
blk.35.ffn_norm.weightF32[6144]
-
blk.35.attn_k.biasF32[512]
-
blk.35.attn_k.weightQ6_K[6144 512]
-
blk.35.attn_output.biasF32[6144]
-
blk.35.attn_output.weightQ6_K[6144 6144]
-
blk.35.attn_q.biasF32[6144]
-
blk.35.attn_q.weightQ6_K[6144 6144]
-
blk.35.attn_v.biasF32[512]
-
blk.35.attn_v.weightQ6_K[6144 512]
-
blk.36.attn_norm.biasF32[6144]
-
blk.36.attn_norm.weightF32[6144]
-
blk.36.ffn_up.biasF32[24576]
-
blk.36.ffn_up.weightQ6_K[6144 24576]
-
blk.36.ffn_down.biasF32[6144]
-
blk.36.ffn_down.weightQ6_K[24576 6144]
-
blk.36.ffn_norm.biasF32[6144]
-
blk.36.ffn_norm.weightF32[6144]
-
blk.36.attn_k.biasF32[512]
-
blk.36.attn_k.weightQ6_K[6144 512]
-
blk.36.attn_output.biasF32[6144]
-
blk.36.attn_output.weightQ6_K[6144 6144]
-
blk.36.attn_q.biasF32[6144]
-
blk.36.attn_q.weightQ6_K[6144 6144]
-
blk.36.attn_v.biasF32[512]
-
blk.36.attn_v.weightQ6_K[6144 512]
-
blk.37.attn_norm.biasF32[6144]
-
blk.37.attn_norm.weightF32[6144]
-
blk.37.ffn_up.biasF32[24576]
-
blk.37.ffn_up.weightQ6_K[6144 24576]
-
blk.37.ffn_down.biasF32[6144]
-
blk.37.ffn_down.weightQ6_K[24576 6144]
-
blk.37.ffn_norm.biasF32[6144]
-
blk.37.ffn_norm.weightF32[6144]
-
blk.37.attn_k.biasF32[512]
-
blk.37.attn_k.weightQ6_K[6144 512]
-
blk.37.attn_output.biasF32[6144]
-
blk.37.attn_output.weightQ6_K[6144 6144]
-
blk.37.attn_q.biasF32[6144]
-
blk.37.attn_q.weightQ6_K[6144 6144]
-
blk.37.attn_v.biasF32[512]
-
blk.37.attn_v.weightQ6_K[6144 512]
-
blk.38.attn_k.biasF32[512]
-
blk.38.attn_k.weightQ6_K[6144 512]
-
blk.38.attn_q.biasF32[6144]
-
blk.38.attn_q.weightQ6_K[6144 6144]
-
blk.38.attn_v.biasF32[512]
-
blk.38.attn_v.weightQ6_K[6144 512]
-
blk.38.attn_norm.biasF32[6144]
-
blk.38.attn_norm.weightF32[6144]
-
blk.38.ffn_up.biasF32[24576]
-
blk.38.ffn_up.weightQ6_K[6144 24576]
-
blk.38.ffn_down.biasF32[6144]
-
blk.38.ffn_down.weightQ6_K[24576 6144]
-
blk.38.ffn_norm.biasF32[6144]
-
blk.38.ffn_norm.weightF32[6144]
-
blk.38.attn_output.biasF32[6144]
-
blk.38.attn_output.weightQ6_K[6144 6144]
-
blk.39.attn_norm.biasF32[6144]
-
blk.39.attn_norm.weightF32[6144]
-
blk.39.ffn_up.biasF32[24576]
-
blk.39.ffn_up.weightQ6_K[6144 24576]
-
blk.39.ffn_down.biasF32[6144]
-
blk.39.ffn_down.weightQ6_K[24576 6144]
-
blk.39.ffn_norm.biasF32[6144]
-
blk.39.ffn_norm.weightF32[6144]
-
blk.39.attn_k.biasF32[512]
-
blk.39.attn_k.weightQ6_K[6144 512]
-
blk.39.attn_output.biasF32[6144]
-
blk.39.attn_output.weightQ6_K[6144 6144]
-
blk.39.attn_q.biasF32[6144]
-
blk.39.attn_q.weightQ6_K[6144 6144]
-
blk.39.attn_v.biasF32[512]
-
blk.39.attn_v.weightQ6_K[6144 512]
-
output.weightQ6_K[6144 49154]
-
output_norm.biasF32[6144]
-
output_norm.weightF32[6144]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39