A capable large language model for natural language to SQL generation.
7B
1,164 Pulls Updated 6 months ago
eb5d3abdf635 · 4.2GB
-
general.architecturellama
-
general.file_typeQ4_1
-
llama.attention.head_count32
-
llama.attention.head_count_kv32
-
llama.attention.layer_norm_rms_epsilon1e-05
-
llama.block_count32
-
llama.context_length16384
-
llama.embedding_length4096
-
llama.feed_forward_length11008
-
llama.rope.dimension_count128
-
llama.rope.freq_base1e+06
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id1
-
tokenizer.ggml.eos_token_id2
-
tokenizer.ggml.modelllama
-
tokenizer.ggml.scores[0 0 0 0 0 ...]
-
tokenizer.ggml.token_type[2 3 3 6 6 ...]
-
tokenizer.ggml.tokens[<unk> <s> </s> <0x00> <0x01> ...]
-
tokenizer.ggml.unknown_token_id0
-
NameTypeShape
-
token_embd.weightQ4_1[4096 32016]
-
blk.0.attn_norm.weightF32[4096]
-
blk.0.ffn_down.weightQ4_1[11008 4096]
-
blk.0.ffn_gate.weightQ4_1[4096 11008]
-
blk.0.ffn_up.weightQ4_1[4096 11008]
-
blk.0.ffn_norm.weightF32[4096]
-
blk.0.attn_k.weightQ4_1[4096 4096]
-
blk.0.attn_output.weightQ4_1[4096 4096]
-
blk.0.attn_q.weightQ4_1[4096 4096]
-
blk.0.attn_v.weightQ4_1[4096 4096]
-
blk.1.attn_norm.weightF32[4096]
-
blk.1.ffn_down.weightQ4_1[11008 4096]
-
blk.1.ffn_gate.weightQ4_1[4096 11008]
-
blk.1.ffn_up.weightQ4_1[4096 11008]
-
blk.1.ffn_norm.weightF32[4096]
-
blk.1.attn_k.weightQ4_1[4096 4096]
-
blk.1.attn_output.weightQ4_1[4096 4096]
-
blk.1.attn_q.weightQ4_1[4096 4096]
-
blk.1.attn_v.weightQ4_1[4096 4096]
-
blk.2.attn_norm.weightF32[4096]
-
blk.2.ffn_down.weightQ4_1[11008 4096]
-
blk.2.ffn_gate.weightQ4_1[4096 11008]
-
blk.2.ffn_up.weightQ4_1[4096 11008]
-
blk.2.ffn_norm.weightF32[4096]
-
blk.2.attn_k.weightQ4_1[4096 4096]
-
blk.2.attn_output.weightQ4_1[4096 4096]
-
blk.2.attn_q.weightQ4_1[4096 4096]
-
blk.2.attn_v.weightQ4_1[4096 4096]
-
blk.3.attn_norm.weightF32[4096]
-
blk.3.ffn_down.weightQ4_1[11008 4096]
-
blk.3.ffn_gate.weightQ4_1[4096 11008]
-
blk.3.ffn_up.weightQ4_1[4096 11008]
-
blk.3.ffn_norm.weightF32[4096]
-
blk.3.attn_k.weightQ4_1[4096 4096]
-
blk.3.attn_output.weightQ4_1[4096 4096]
-
blk.3.attn_q.weightQ4_1[4096 4096]
-
blk.3.attn_v.weightQ4_1[4096 4096]
-
blk.4.attn_norm.weightF32[4096]
-
blk.4.ffn_down.weightQ4_1[11008 4096]
-
blk.4.ffn_gate.weightQ4_1[4096 11008]
-
blk.4.ffn_up.weightQ4_1[4096 11008]
-
blk.4.ffn_norm.weightF32[4096]
-
blk.4.attn_k.weightQ4_1[4096 4096]
-
blk.4.attn_output.weightQ4_1[4096 4096]
-
blk.4.attn_q.weightQ4_1[4096 4096]
-
blk.4.attn_v.weightQ4_1[4096 4096]
-
blk.5.attn_norm.weightF32[4096]
-
blk.5.ffn_down.weightQ4_1[11008 4096]
-
blk.5.ffn_gate.weightQ4_1[4096 11008]
-
blk.5.ffn_up.weightQ4_1[4096 11008]
-
blk.5.ffn_norm.weightF32[4096]
-
blk.5.attn_k.weightQ4_1[4096 4096]
-
blk.5.attn_output.weightQ4_1[4096 4096]
-
blk.5.attn_q.weightQ4_1[4096 4096]
-
blk.5.attn_v.weightQ4_1[4096 4096]
-
blk.6.attn_norm.weightF32[4096]
-
blk.6.ffn_down.weightQ4_1[11008 4096]
-
blk.6.ffn_gate.weightQ4_1[4096 11008]
-
blk.6.ffn_up.weightQ4_1[4096 11008]
-
blk.6.ffn_norm.weightF32[4096]
-
blk.6.attn_k.weightQ4_1[4096 4096]
-
blk.6.attn_output.weightQ4_1[4096 4096]
-
blk.6.attn_q.weightQ4_1[4096 4096]
-
blk.6.attn_v.weightQ4_1[4096 4096]
-
blk.7.attn_norm.weightF32[4096]
-
blk.7.ffn_down.weightQ4_1[11008 4096]
-
blk.7.ffn_gate.weightQ4_1[4096 11008]
-
blk.7.ffn_up.weightQ4_1[4096 11008]
-
blk.7.ffn_norm.weightF32[4096]
-
blk.7.attn_k.weightQ4_1[4096 4096]
-
blk.7.attn_output.weightQ4_1[4096 4096]
-
blk.7.attn_q.weightQ4_1[4096 4096]
-
blk.7.attn_v.weightQ4_1[4096 4096]
-
blk.8.attn_norm.weightF32[4096]
-
blk.8.ffn_down.weightQ4_1[11008 4096]
-
blk.8.ffn_gate.weightQ4_1[4096 11008]
-
blk.8.ffn_up.weightQ4_1[4096 11008]
-
blk.8.ffn_norm.weightF32[4096]
-
blk.8.attn_k.weightQ4_1[4096 4096]
-
blk.8.attn_output.weightQ4_1[4096 4096]
-
blk.8.attn_q.weightQ4_1[4096 4096]
-
blk.8.attn_v.weightQ4_1[4096 4096]
-
blk.9.attn_norm.weightF32[4096]
-
blk.9.ffn_down.weightQ4_1[11008 4096]
-
blk.9.ffn_gate.weightQ4_1[4096 11008]
-
blk.9.ffn_up.weightQ4_1[4096 11008]
-
blk.9.ffn_norm.weightF32[4096]
-
blk.9.attn_k.weightQ4_1[4096 4096]
-
blk.9.attn_output.weightQ4_1[4096 4096]
-
blk.9.attn_q.weightQ4_1[4096 4096]
-
blk.9.attn_v.weightQ4_1[4096 4096]
-
blk.10.attn_norm.weightF32[4096]
-
blk.10.ffn_down.weightQ4_1[11008 4096]
-
blk.10.ffn_gate.weightQ4_1[4096 11008]
-
blk.10.ffn_up.weightQ4_1[4096 11008]
-
blk.10.ffn_norm.weightF32[4096]
-
blk.10.attn_k.weightQ4_1[4096 4096]
-
blk.10.attn_output.weightQ4_1[4096 4096]
-
blk.10.attn_q.weightQ4_1[4096 4096]
-
blk.10.attn_v.weightQ4_1[4096 4096]
-
blk.11.ffn_gate.weightQ4_1[4096 11008]
-
blk.11.attn_k.weightQ4_1[4096 4096]
-
blk.11.attn_output.weightQ4_1[4096 4096]
-
blk.11.attn_q.weightQ4_1[4096 4096]
-
blk.11.attn_v.weightQ4_1[4096 4096]
-
blk.11.attn_norm.weightF32[4096]
-
blk.11.ffn_down.weightQ4_1[11008 4096]
-
blk.11.ffn_up.weightQ4_1[4096 11008]
-
blk.11.ffn_norm.weightF32[4096]
-
blk.12.attn_norm.weightF32[4096]
-
blk.12.ffn_down.weightQ4_1[11008 4096]
-
blk.12.ffn_gate.weightQ4_1[4096 11008]
-
blk.12.ffn_up.weightQ4_1[4096 11008]
-
blk.12.ffn_norm.weightF32[4096]
-
blk.12.attn_k.weightQ4_1[4096 4096]
-
blk.12.attn_output.weightQ4_1[4096 4096]
-
blk.12.attn_q.weightQ4_1[4096 4096]
-
blk.12.attn_v.weightQ4_1[4096 4096]
-
blk.13.attn_norm.weightF32[4096]
-
blk.13.ffn_down.weightQ4_1[11008 4096]
-
blk.13.ffn_gate.weightQ4_1[4096 11008]
-
blk.13.ffn_up.weightQ4_1[4096 11008]
-
blk.13.ffn_norm.weightF32[4096]
-
blk.13.attn_k.weightQ4_1[4096 4096]
-
blk.13.attn_output.weightQ4_1[4096 4096]
-
blk.13.attn_q.weightQ4_1[4096 4096]
-
blk.13.attn_v.weightQ4_1[4096 4096]
-
blk.14.attn_norm.weightF32[4096]
-
blk.14.ffn_down.weightQ4_1[11008 4096]
-
blk.14.ffn_gate.weightQ4_1[4096 11008]
-
blk.14.ffn_up.weightQ4_1[4096 11008]
-
blk.14.ffn_norm.weightF32[4096]
-
blk.14.attn_k.weightQ4_1[4096 4096]
-
blk.14.attn_output.weightQ4_1[4096 4096]
-
blk.14.attn_q.weightQ4_1[4096 4096]
-
blk.14.attn_v.weightQ4_1[4096 4096]
-
blk.15.attn_norm.weightF32[4096]
-
blk.15.ffn_down.weightQ4_1[11008 4096]
-
blk.15.ffn_gate.weightQ4_1[4096 11008]
-
blk.15.ffn_up.weightQ4_1[4096 11008]
-
blk.15.ffn_norm.weightF32[4096]
-
blk.15.attn_k.weightQ4_1[4096 4096]
-
blk.15.attn_output.weightQ4_1[4096 4096]
-
blk.15.attn_q.weightQ4_1[4096 4096]
-
blk.15.attn_v.weightQ4_1[4096 4096]
-
blk.16.attn_norm.weightF32[4096]
-
blk.16.ffn_down.weightQ4_1[11008 4096]
-
blk.16.ffn_gate.weightQ4_1[4096 11008]
-
blk.16.ffn_up.weightQ4_1[4096 11008]
-
blk.16.ffn_norm.weightF32[4096]
-
blk.16.attn_k.weightQ4_1[4096 4096]
-
blk.16.attn_output.weightQ4_1[4096 4096]
-
blk.16.attn_q.weightQ4_1[4096 4096]
-
blk.16.attn_v.weightQ4_1[4096 4096]
-
blk.17.attn_norm.weightF32[4096]
-
blk.17.ffn_down.weightQ4_1[11008 4096]
-
blk.17.ffn_gate.weightQ4_1[4096 11008]
-
blk.17.ffn_up.weightQ4_1[4096 11008]
-
blk.17.ffn_norm.weightF32[4096]
-
blk.17.attn_k.weightQ4_1[4096 4096]
-
blk.17.attn_output.weightQ4_1[4096 4096]
-
blk.17.attn_q.weightQ4_1[4096 4096]
-
blk.17.attn_v.weightQ4_1[4096 4096]
-
blk.18.attn_norm.weightF32[4096]
-
blk.18.ffn_down.weightQ4_1[11008 4096]
-
blk.18.ffn_gate.weightQ4_1[4096 11008]
-
blk.18.ffn_up.weightQ4_1[4096 11008]
-
blk.18.ffn_norm.weightF32[4096]
-
blk.18.attn_k.weightQ4_1[4096 4096]
-
blk.18.attn_output.weightQ4_1[4096 4096]
-
blk.18.attn_q.weightQ4_1[4096 4096]
-
blk.18.attn_v.weightQ4_1[4096 4096]
-
blk.19.attn_norm.weightF32[4096]
-
blk.19.ffn_down.weightQ4_1[11008 4096]
-
blk.19.ffn_gate.weightQ4_1[4096 11008]
-
blk.19.ffn_up.weightQ4_1[4096 11008]
-
blk.19.ffn_norm.weightF32[4096]
-
blk.19.attn_k.weightQ4_1[4096 4096]
-
blk.19.attn_output.weightQ4_1[4096 4096]
-
blk.19.attn_q.weightQ4_1[4096 4096]
-
blk.19.attn_v.weightQ4_1[4096 4096]
-
blk.20.attn_norm.weightF32[4096]
-
blk.20.ffn_down.weightQ4_1[11008 4096]
-
blk.20.ffn_gate.weightQ4_1[4096 11008]
-
blk.20.ffn_up.weightQ4_1[4096 11008]
-
blk.20.ffn_norm.weightF32[4096]
-
blk.20.attn_k.weightQ4_1[4096 4096]
-
blk.20.attn_output.weightQ4_1[4096 4096]
-
blk.20.attn_q.weightQ4_1[4096 4096]
-
blk.20.attn_v.weightQ4_1[4096 4096]
-
blk.21.attn_norm.weightF32[4096]
-
blk.21.ffn_down.weightQ4_1[11008 4096]
-
blk.21.ffn_gate.weightQ4_1[4096 11008]
-
blk.21.ffn_up.weightQ4_1[4096 11008]
-
blk.21.ffn_norm.weightF32[4096]
-
blk.21.attn_k.weightQ4_1[4096 4096]
-
blk.21.attn_output.weightQ4_1[4096 4096]
-
blk.21.attn_q.weightQ4_1[4096 4096]
-
blk.21.attn_v.weightQ4_1[4096 4096]
-
blk.22.attn_norm.weightF32[4096]
-
blk.22.ffn_down.weightQ4_1[11008 4096]
-
blk.22.ffn_gate.weightQ4_1[4096 11008]
-
blk.22.ffn_up.weightQ4_1[4096 11008]
-
blk.22.ffn_norm.weightF32[4096]
-
blk.22.attn_k.weightQ4_1[4096 4096]
-
blk.22.attn_output.weightQ4_1[4096 4096]
-
blk.22.attn_q.weightQ4_1[4096 4096]
-
blk.22.attn_v.weightQ4_1[4096 4096]
-
blk.23.ffn_gate.weightQ4_1[4096 11008]
-
blk.23.ffn_up.weightQ4_1[4096 11008]
-
blk.23.attn_k.weightQ4_1[4096 4096]
-
blk.23.attn_output.weightQ4_1[4096 4096]
-
blk.23.attn_q.weightQ4_1[4096 4096]
-
blk.23.attn_v.weightQ4_1[4096 4096]
-
blk.23.attn_norm.weightF32[4096]
-
blk.23.ffn_down.weightQ4_1[11008 4096]
-
blk.23.ffn_norm.weightF32[4096]
-
blk.24.attn_norm.weightF32[4096]
-
blk.24.ffn_down.weightQ4_1[11008 4096]
-
blk.24.ffn_gate.weightQ4_1[4096 11008]
-
blk.24.ffn_up.weightQ4_1[4096 11008]
-
blk.24.ffn_norm.weightF32[4096]
-
blk.24.attn_k.weightQ4_1[4096 4096]
-
blk.24.attn_output.weightQ4_1[4096 4096]
-
blk.24.attn_q.weightQ4_1[4096 4096]
-
blk.24.attn_v.weightQ4_1[4096 4096]
-
blk.25.attn_norm.weightF32[4096]
-
blk.25.ffn_down.weightQ4_1[11008 4096]
-
blk.25.ffn_gate.weightQ4_1[4096 11008]
-
blk.25.ffn_up.weightQ4_1[4096 11008]
-
blk.25.ffn_norm.weightF32[4096]
-
blk.25.attn_k.weightQ4_1[4096 4096]
-
blk.25.attn_output.weightQ4_1[4096 4096]
-
blk.25.attn_q.weightQ4_1[4096 4096]
-
blk.25.attn_v.weightQ4_1[4096 4096]
-
blk.26.attn_norm.weightF32[4096]
-
blk.26.ffn_down.weightQ4_1[11008 4096]
-
blk.26.ffn_gate.weightQ4_1[4096 11008]
-
blk.26.ffn_up.weightQ4_1[4096 11008]
-
blk.26.ffn_norm.weightF32[4096]
-
blk.26.attn_k.weightQ4_1[4096 4096]
-
blk.26.attn_output.weightQ4_1[4096 4096]
-
blk.26.attn_q.weightQ4_1[4096 4096]
-
blk.26.attn_v.weightQ4_1[4096 4096]
-
blk.27.attn_norm.weightF32[4096]
-
blk.27.ffn_down.weightQ4_1[11008 4096]
-
blk.27.ffn_gate.weightQ4_1[4096 11008]
-
blk.27.ffn_up.weightQ4_1[4096 11008]
-
blk.27.ffn_norm.weightF32[4096]
-
blk.27.attn_k.weightQ4_1[4096 4096]
-
blk.27.attn_output.weightQ4_1[4096 4096]
-
blk.27.attn_q.weightQ4_1[4096 4096]
-
blk.27.attn_v.weightQ4_1[4096 4096]
-
blk.28.attn_norm.weightF32[4096]
-
blk.28.ffn_down.weightQ4_1[11008 4096]
-
blk.28.ffn_gate.weightQ4_1[4096 11008]
-
blk.28.ffn_up.weightQ4_1[4096 11008]
-
blk.28.ffn_norm.weightF32[4096]
-
blk.28.attn_k.weightQ4_1[4096 4096]
-
blk.28.attn_output.weightQ4_1[4096 4096]
-
blk.28.attn_q.weightQ4_1[4096 4096]
-
blk.28.attn_v.weightQ4_1[4096 4096]
-
blk.29.attn_norm.weightF32[4096]
-
blk.29.ffn_down.weightQ4_1[11008 4096]
-
blk.29.ffn_gate.weightQ4_1[4096 11008]
-
blk.29.ffn_up.weightQ4_1[4096 11008]
-
blk.29.ffn_norm.weightF32[4096]
-
blk.29.attn_k.weightQ4_1[4096 4096]
-
blk.29.attn_output.weightQ4_1[4096 4096]
-
blk.29.attn_q.weightQ4_1[4096 4096]
-
blk.29.attn_v.weightQ4_1[4096 4096]
-
blk.30.attn_norm.weightF32[4096]
-
blk.30.ffn_down.weightQ4_1[11008 4096]
-
blk.30.ffn_gate.weightQ4_1[4096 11008]
-
blk.30.ffn_up.weightQ4_1[4096 11008]
-
blk.30.ffn_norm.weightF32[4096]
-
blk.30.attn_k.weightQ4_1[4096 4096]
-
blk.30.attn_output.weightQ4_1[4096 4096]
-
blk.30.attn_q.weightQ4_1[4096 4096]
-
blk.30.attn_v.weightQ4_1[4096 4096]
-
blk.31.attn_norm.weightF32[4096]
-
blk.31.ffn_down.weightQ4_1[11008 4096]
-
blk.31.ffn_gate.weightQ4_1[4096 11008]
-
blk.31.ffn_up.weightQ4_1[4096 11008]
-
blk.31.ffn_norm.weightF32[4096]
-
blk.31.attn_k.weightQ4_1[4096 4096]
-
blk.31.attn_output.weightQ4_1[4096 4096]
-
blk.31.attn_q.weightQ4_1[4096 4096]
-
blk.31.attn_v.weightQ4_1[4096 4096]
-
output.weightQ6_K[4096 32016]
-
output_norm.weightF32[4096]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31