Versions of command-r using either the default system prompt or the rag/tool use prompt suggested by Cohere.
35B
155 Pulls Updated 5 months ago
d3965f1bd415 · 22GB
-
general.architecturecommand-r
-
general.file_typeQ4_1
-
command-r.attention.head_count64
-
command-r.attention.head_count_kv64
-
command-r.attention.layer_norm_epsilon1e-05
-
command-r.block_count40
-
command-r.context_length131072
-
command-r.embedding_length8192
-
command-r.feed_forward_length22528
-
command-r.logit_scale0.0625
-
command-r.rope.freq_base8e+06
-
command-r.rope.scaling.typenone
-
tokenizer.ggml.add_bos_tokentrue
-
tokenizer.ggml.add_eos_tokenfalse
-
tokenizer.ggml.bos_token_id5
-
tokenizer.ggml.eos_token_id255001
-
tokenizer.ggml.merges[Ġ Ġ Ġ t e r i n Ġ a ...]
-
tokenizer.ggml.modelgpt2
-
tokenizer.ggml.padding_token_id0
-
tokenizer.ggml.token_type[3 3 3 3 3 ...]
-
tokenizer.ggml.tokens[<PAD> <UNK> <CLS> <SEP> <MASK_TOKEN> ...]
-
NameTypeShape
-
token_embd.weightQ6_K[8192 256000]
-
blk.0.attn_k.weightQ4_1[8192 8192]
-
blk.0.attn_output.weightQ4_1[8192 8192]
-
blk.0.attn_q.weightQ4_1[8192 8192]
-
blk.0.attn_v.weightQ4_1[8192 8192]
-
blk.0.attn_norm.weightF32[8192]
-
blk.0.ffn_down.weightQ4_1[22528 8192]
-
blk.0.ffn_gate.weightQ4_1[8192 22528]
-
blk.0.ffn_up.weightQ4_1[8192 22528]
-
blk.1.attn_norm.weightF32[8192]
-
blk.1.ffn_down.weightQ4_1[22528 8192]
-
blk.1.ffn_gate.weightQ4_1[8192 22528]
-
blk.1.ffn_up.weightQ4_1[8192 22528]
-
blk.1.attn_k.weightQ4_1[8192 8192]
-
blk.1.attn_output.weightQ4_1[8192 8192]
-
blk.1.attn_q.weightQ4_1[8192 8192]
-
blk.1.attn_v.weightQ4_1[8192 8192]
-
blk.2.attn_norm.weightF32[8192]
-
blk.2.ffn_down.weightQ4_1[22528 8192]
-
blk.2.ffn_gate.weightQ4_1[8192 22528]
-
blk.2.ffn_up.weightQ4_1[8192 22528]
-
blk.2.attn_k.weightQ4_1[8192 8192]
-
blk.2.attn_output.weightQ4_1[8192 8192]
-
blk.2.attn_q.weightQ4_1[8192 8192]
-
blk.2.attn_v.weightQ4_1[8192 8192]
-
blk.3.attn_k.weightQ4_1[8192 8192]
-
blk.3.attn_output.weightQ4_1[8192 8192]
-
blk.3.attn_q.weightQ4_1[8192 8192]
-
blk.3.attn_v.weightQ4_1[8192 8192]
-
blk.3.attn_norm.weightF32[8192]
-
blk.3.ffn_down.weightQ4_1[22528 8192]
-
blk.3.ffn_gate.weightQ4_1[8192 22528]
-
blk.3.ffn_up.weightQ4_1[8192 22528]
-
blk.4.attn_norm.weightF32[8192]
-
blk.4.ffn_down.weightQ4_1[22528 8192]
-
blk.4.ffn_gate.weightQ4_1[8192 22528]
-
blk.4.ffn_up.weightQ4_1[8192 22528]
-
blk.4.attn_k.weightQ4_1[8192 8192]
-
blk.4.attn_output.weightQ4_1[8192 8192]
-
blk.4.attn_q.weightQ4_1[8192 8192]
-
blk.4.attn_v.weightQ4_1[8192 8192]
-
blk.5.attn_norm.weightF32[8192]
-
blk.5.ffn_down.weightQ4_1[22528 8192]
-
blk.5.ffn_gate.weightQ4_1[8192 22528]
-
blk.5.ffn_up.weightQ4_1[8192 22528]
-
blk.5.attn_k.weightQ4_1[8192 8192]
-
blk.5.attn_output.weightQ4_1[8192 8192]
-
blk.5.attn_q.weightQ4_1[8192 8192]
-
blk.5.attn_v.weightQ4_1[8192 8192]
-
blk.6.attn_k.weightQ4_1[8192 8192]
-
blk.6.attn_output.weightQ4_1[8192 8192]
-
blk.6.attn_q.weightQ4_1[8192 8192]
-
blk.6.attn_v.weightQ4_1[8192 8192]
-
blk.6.attn_norm.weightF32[8192]
-
blk.6.ffn_down.weightQ4_1[22528 8192]
-
blk.6.ffn_gate.weightQ4_1[8192 22528]
-
blk.6.ffn_up.weightQ4_1[8192 22528]
-
blk.7.attn_norm.weightF32[8192]
-
blk.7.ffn_down.weightQ4_1[22528 8192]
-
blk.7.ffn_gate.weightQ4_1[8192 22528]
-
blk.7.ffn_up.weightQ4_1[8192 22528]
-
blk.7.attn_k.weightQ4_1[8192 8192]
-
blk.7.attn_output.weightQ4_1[8192 8192]
-
blk.7.attn_q.weightQ4_1[8192 8192]
-
blk.7.attn_v.weightQ4_1[8192 8192]
-
blk.8.attn_norm.weightF32[8192]
-
blk.8.ffn_down.weightQ4_1[22528 8192]
-
blk.8.ffn_gate.weightQ4_1[8192 22528]
-
blk.8.ffn_up.weightQ4_1[8192 22528]
-
blk.8.attn_k.weightQ4_1[8192 8192]
-
blk.8.attn_output.weightQ4_1[8192 8192]
-
blk.8.attn_q.weightQ4_1[8192 8192]
-
blk.8.attn_v.weightQ4_1[8192 8192]
-
blk.9.attn_k.weightQ4_1[8192 8192]
-
blk.9.attn_output.weightQ4_1[8192 8192]
-
blk.9.attn_q.weightQ4_1[8192 8192]
-
blk.9.attn_v.weightQ4_1[8192 8192]
-
blk.9.attn_norm.weightF32[8192]
-
blk.9.ffn_down.weightQ4_1[22528 8192]
-
blk.9.ffn_gate.weightQ4_1[8192 22528]
-
blk.9.ffn_up.weightQ4_1[8192 22528]
-
blk.10.attn_norm.weightF32[8192]
-
blk.10.ffn_down.weightQ4_1[22528 8192]
-
blk.10.ffn_gate.weightQ4_1[8192 22528]
-
blk.10.ffn_up.weightQ4_1[8192 22528]
-
blk.10.attn_k.weightQ4_1[8192 8192]
-
blk.10.attn_output.weightQ4_1[8192 8192]
-
blk.10.attn_q.weightQ4_1[8192 8192]
-
blk.10.attn_v.weightQ4_1[8192 8192]
-
blk.11.attn_norm.weightF32[8192]
-
blk.11.ffn_down.weightQ4_1[22528 8192]
-
blk.11.ffn_gate.weightQ4_1[8192 22528]
-
blk.11.ffn_up.weightQ4_1[8192 22528]
-
blk.11.attn_k.weightQ4_1[8192 8192]
-
blk.11.attn_output.weightQ4_1[8192 8192]
-
blk.11.attn_q.weightQ4_1[8192 8192]
-
blk.11.attn_v.weightQ4_1[8192 8192]
-
blk.12.attn_k.weightQ4_1[8192 8192]
-
blk.12.attn_output.weightQ4_1[8192 8192]
-
blk.12.attn_q.weightQ4_1[8192 8192]
-
blk.12.attn_v.weightQ4_1[8192 8192]
-
blk.12.attn_norm.weightF32[8192]
-
blk.12.ffn_down.weightQ4_1[22528 8192]
-
blk.12.ffn_gate.weightQ4_1[8192 22528]
-
blk.12.ffn_up.weightQ4_1[8192 22528]
-
blk.13.attn_norm.weightF32[8192]
-
blk.13.ffn_down.weightQ4_1[22528 8192]
-
blk.13.ffn_gate.weightQ4_1[8192 22528]
-
blk.13.ffn_up.weightQ4_1[8192 22528]
-
blk.13.attn_k.weightQ4_1[8192 8192]
-
blk.13.attn_output.weightQ4_1[8192 8192]
-
blk.13.attn_q.weightQ4_1[8192 8192]
-
blk.13.attn_v.weightQ4_1[8192 8192]
-
blk.14.attn_norm.weightF32[8192]
-
blk.14.ffn_down.weightQ4_1[22528 8192]
-
blk.14.ffn_gate.weightQ4_1[8192 22528]
-
blk.14.ffn_up.weightQ4_1[8192 22528]
-
blk.14.attn_k.weightQ4_1[8192 8192]
-
blk.14.attn_output.weightQ4_1[8192 8192]
-
blk.14.attn_q.weightQ4_1[8192 8192]
-
blk.14.attn_v.weightQ4_1[8192 8192]
-
blk.15.attn_k.weightQ4_1[8192 8192]
-
blk.15.attn_output.weightQ4_1[8192 8192]
-
blk.15.attn_q.weightQ4_1[8192 8192]
-
blk.15.attn_v.weightQ4_1[8192 8192]
-
blk.15.attn_norm.weightF32[8192]
-
blk.15.ffn_down.weightQ4_1[22528 8192]
-
blk.15.ffn_gate.weightQ4_1[8192 22528]
-
blk.15.ffn_up.weightQ4_1[8192 22528]
-
blk.16.attn_norm.weightF32[8192]
-
blk.16.ffn_down.weightQ4_1[22528 8192]
-
blk.16.ffn_gate.weightQ4_1[8192 22528]
-
blk.16.ffn_up.weightQ4_1[8192 22528]
-
blk.16.attn_k.weightQ4_1[8192 8192]
-
blk.16.attn_output.weightQ4_1[8192 8192]
-
blk.16.attn_q.weightQ4_1[8192 8192]
-
blk.16.attn_v.weightQ4_1[8192 8192]
-
blk.17.attn_norm.weightF32[8192]
-
blk.17.ffn_down.weightQ4_1[22528 8192]
-
blk.17.ffn_gate.weightQ4_1[8192 22528]
-
blk.17.ffn_up.weightQ4_1[8192 22528]
-
blk.17.attn_k.weightQ4_1[8192 8192]
-
blk.17.attn_output.weightQ4_1[8192 8192]
-
blk.17.attn_q.weightQ4_1[8192 8192]
-
blk.17.attn_v.weightQ4_1[8192 8192]
-
blk.18.attn_k.weightQ4_1[8192 8192]
-
blk.18.attn_output.weightQ4_1[8192 8192]
-
blk.18.attn_q.weightQ4_1[8192 8192]
-
blk.18.attn_v.weightQ4_1[8192 8192]
-
blk.18.attn_norm.weightF32[8192]
-
blk.18.ffn_down.weightQ4_1[22528 8192]
-
blk.18.ffn_gate.weightQ4_1[8192 22528]
-
blk.18.ffn_up.weightQ4_1[8192 22528]
-
blk.19.attn_norm.weightF32[8192]
-
blk.19.ffn_down.weightQ4_1[22528 8192]
-
blk.19.ffn_gate.weightQ4_1[8192 22528]
-
blk.19.ffn_up.weightQ4_1[8192 22528]
-
blk.19.attn_k.weightQ4_1[8192 8192]
-
blk.19.attn_output.weightQ4_1[8192 8192]
-
blk.19.attn_q.weightQ4_1[8192 8192]
-
blk.19.attn_v.weightQ4_1[8192 8192]
-
blk.20.attn_norm.weightF32[8192]
-
blk.20.ffn_down.weightQ4_1[22528 8192]
-
blk.20.ffn_gate.weightQ4_1[8192 22528]
-
blk.20.ffn_up.weightQ4_1[8192 22528]
-
blk.20.attn_k.weightQ4_1[8192 8192]
-
blk.20.attn_output.weightQ4_1[8192 8192]
-
blk.20.attn_q.weightQ4_1[8192 8192]
-
blk.20.attn_v.weightQ4_1[8192 8192]
-
blk.21.attn_k.weightQ4_1[8192 8192]
-
blk.21.attn_output.weightQ4_1[8192 8192]
-
blk.21.attn_q.weightQ4_1[8192 8192]
-
blk.21.attn_v.weightQ4_1[8192 8192]
-
blk.21.attn_norm.weightF32[8192]
-
blk.21.ffn_down.weightQ4_1[22528 8192]
-
blk.21.ffn_gate.weightQ4_1[8192 22528]
-
blk.21.ffn_up.weightQ4_1[8192 22528]
-
blk.22.attn_norm.weightF32[8192]
-
blk.22.ffn_down.weightQ4_1[22528 8192]
-
blk.22.ffn_gate.weightQ4_1[8192 22528]
-
blk.22.ffn_up.weightQ4_1[8192 22528]
-
blk.22.attn_k.weightQ4_1[8192 8192]
-
blk.22.attn_output.weightQ4_1[8192 8192]
-
blk.22.attn_q.weightQ4_1[8192 8192]
-
blk.22.attn_v.weightQ4_1[8192 8192]
-
blk.23.attn_norm.weightF32[8192]
-
blk.23.ffn_down.weightQ4_1[22528 8192]
-
blk.23.ffn_gate.weightQ4_1[8192 22528]
-
blk.23.ffn_up.weightQ4_1[8192 22528]
-
blk.23.attn_k.weightQ4_1[8192 8192]
-
blk.23.attn_output.weightQ4_1[8192 8192]
-
blk.23.attn_q.weightQ4_1[8192 8192]
-
blk.23.attn_v.weightQ4_1[8192 8192]
-
blk.24.attn_k.weightQ4_1[8192 8192]
-
blk.24.attn_output.weightQ4_1[8192 8192]
-
blk.24.attn_q.weightQ4_1[8192 8192]
-
blk.24.attn_v.weightQ4_1[8192 8192]
-
blk.24.attn_norm.weightF32[8192]
-
blk.24.ffn_down.weightQ4_1[22528 8192]
-
blk.24.ffn_gate.weightQ4_1[8192 22528]
-
blk.24.ffn_up.weightQ4_1[8192 22528]
-
blk.25.attn_norm.weightF32[8192]
-
blk.25.ffn_down.weightQ4_1[22528 8192]
-
blk.25.ffn_gate.weightQ4_1[8192 22528]
-
blk.25.ffn_up.weightQ4_1[8192 22528]
-
blk.25.attn_k.weightQ4_1[8192 8192]
-
blk.25.attn_output.weightQ4_1[8192 8192]
-
blk.25.attn_q.weightQ4_1[8192 8192]
-
blk.25.attn_v.weightQ4_1[8192 8192]
-
blk.26.attn_norm.weightF32[8192]
-
blk.26.ffn_down.weightQ4_1[22528 8192]
-
blk.26.ffn_gate.weightQ4_1[8192 22528]
-
blk.26.ffn_up.weightQ4_1[8192 22528]
-
blk.26.attn_k.weightQ4_1[8192 8192]
-
blk.26.attn_output.weightQ4_1[8192 8192]
-
blk.26.attn_q.weightQ4_1[8192 8192]
-
blk.26.attn_v.weightQ4_1[8192 8192]
-
blk.27.attn_k.weightQ4_1[8192 8192]
-
blk.27.attn_output.weightQ4_1[8192 8192]
-
blk.27.attn_q.weightQ4_1[8192 8192]
-
blk.27.attn_v.weightQ4_1[8192 8192]
-
blk.27.attn_norm.weightF32[8192]
-
blk.27.ffn_down.weightQ4_1[22528 8192]
-
blk.27.ffn_gate.weightQ4_1[8192 22528]
-
blk.27.ffn_up.weightQ4_1[8192 22528]
-
blk.28.attn_norm.weightF32[8192]
-
blk.28.ffn_down.weightQ4_1[22528 8192]
-
blk.28.ffn_gate.weightQ4_1[8192 22528]
-
blk.28.ffn_up.weightQ4_1[8192 22528]
-
blk.28.attn_k.weightQ4_1[8192 8192]
-
blk.28.attn_output.weightQ4_1[8192 8192]
-
blk.28.attn_q.weightQ4_1[8192 8192]
-
blk.28.attn_v.weightQ4_1[8192 8192]
-
blk.29.attn_norm.weightF32[8192]
-
blk.29.ffn_down.weightQ4_1[22528 8192]
-
blk.29.ffn_gate.weightQ4_1[8192 22528]
-
blk.29.ffn_up.weightQ4_1[8192 22528]
-
blk.29.attn_k.weightQ4_1[8192 8192]
-
blk.29.attn_output.weightQ4_1[8192 8192]
-
blk.29.attn_q.weightQ4_1[8192 8192]
-
blk.29.attn_v.weightQ4_1[8192 8192]
-
blk.30.attn_k.weightQ4_1[8192 8192]
-
blk.30.attn_output.weightQ4_1[8192 8192]
-
blk.30.attn_q.weightQ4_1[8192 8192]
-
blk.30.attn_v.weightQ4_1[8192 8192]
-
blk.30.attn_norm.weightF32[8192]
-
blk.30.ffn_down.weightQ4_1[22528 8192]
-
blk.30.ffn_gate.weightQ4_1[8192 22528]
-
blk.30.ffn_up.weightQ4_1[8192 22528]
-
blk.31.attn_norm.weightF32[8192]
-
blk.31.ffn_down.weightQ4_1[22528 8192]
-
blk.31.ffn_gate.weightQ4_1[8192 22528]
-
blk.31.ffn_up.weightQ4_1[8192 22528]
-
blk.31.attn_k.weightQ4_1[8192 8192]
-
blk.31.attn_output.weightQ4_1[8192 8192]
-
blk.31.attn_q.weightQ4_1[8192 8192]
-
blk.31.attn_v.weightQ4_1[8192 8192]
-
blk.32.attn_norm.weightF32[8192]
-
blk.32.ffn_down.weightQ4_1[22528 8192]
-
blk.32.ffn_gate.weightQ4_1[8192 22528]
-
blk.32.ffn_up.weightQ4_1[8192 22528]
-
blk.32.attn_k.weightQ4_1[8192 8192]
-
blk.32.attn_output.weightQ4_1[8192 8192]
-
blk.32.attn_q.weightQ4_1[8192 8192]
-
blk.32.attn_v.weightQ4_1[8192 8192]
-
blk.33.attn_k.weightQ4_1[8192 8192]
-
blk.33.attn_output.weightQ4_1[8192 8192]
-
blk.33.attn_q.weightQ4_1[8192 8192]
-
blk.33.attn_v.weightQ4_1[8192 8192]
-
blk.33.attn_norm.weightF32[8192]
-
blk.33.ffn_down.weightQ4_1[22528 8192]
-
blk.33.ffn_gate.weightQ4_1[8192 22528]
-
blk.33.ffn_up.weightQ4_1[8192 22528]
-
blk.34.attn_norm.weightF32[8192]
-
blk.34.ffn_down.weightQ4_1[22528 8192]
-
blk.34.ffn_gate.weightQ4_1[8192 22528]
-
blk.34.ffn_up.weightQ4_1[8192 22528]
-
blk.34.attn_k.weightQ4_1[8192 8192]
-
blk.34.attn_output.weightQ4_1[8192 8192]
-
blk.34.attn_q.weightQ4_1[8192 8192]
-
blk.34.attn_v.weightQ4_1[8192 8192]
-
blk.35.attn_norm.weightF32[8192]
-
blk.35.ffn_down.weightQ4_1[22528 8192]
-
blk.35.ffn_gate.weightQ4_1[8192 22528]
-
blk.35.ffn_up.weightQ4_1[8192 22528]
-
blk.35.attn_k.weightQ4_1[8192 8192]
-
blk.35.attn_output.weightQ4_1[8192 8192]
-
blk.35.attn_q.weightQ4_1[8192 8192]
-
blk.35.attn_v.weightQ4_1[8192 8192]
-
blk.36.attn_k.weightQ4_1[8192 8192]
-
blk.36.attn_output.weightQ4_1[8192 8192]
-
blk.36.attn_q.weightQ4_1[8192 8192]
-
blk.36.attn_v.weightQ4_1[8192 8192]
-
blk.36.attn_norm.weightF32[8192]
-
blk.36.ffn_down.weightQ4_1[22528 8192]
-
blk.36.ffn_gate.weightQ4_1[8192 22528]
-
blk.36.ffn_up.weightQ4_1[8192 22528]
-
blk.37.attn_norm.weightF32[8192]
-
blk.37.ffn_down.weightQ4_1[22528 8192]
-
blk.37.ffn_gate.weightQ4_1[8192 22528]
-
blk.37.ffn_up.weightQ4_1[8192 22528]
-
blk.37.attn_k.weightQ4_1[8192 8192]
-
blk.37.attn_output.weightQ4_1[8192 8192]
-
blk.37.attn_q.weightQ4_1[8192 8192]
-
blk.37.attn_v.weightQ4_1[8192 8192]
-
blk.38.attn_norm.weightF32[8192]
-
blk.38.ffn_down.weightQ4_1[22528 8192]
-
blk.38.ffn_gate.weightQ4_1[8192 22528]
-
blk.38.ffn_up.weightQ4_1[8192 22528]
-
blk.38.attn_k.weightQ4_1[8192 8192]
-
blk.38.attn_output.weightQ4_1[8192 8192]
-
blk.38.attn_q.weightQ4_1[8192 8192]
-
blk.38.attn_v.weightQ4_1[8192 8192]
-
blk.39.attn_k.weightQ4_1[8192 8192]
-
blk.39.attn_output.weightQ4_1[8192 8192]
-
blk.39.attn_q.weightQ4_1[8192 8192]
-
blk.39.attn_v.weightQ4_1[8192 8192]
-
blk.39.attn_norm.weightF32[8192]
-
blk.39.ffn_down.weightQ4_1[22528 8192]
-
blk.39.ffn_gate.weightQ4_1[8192 22528]
-
blk.39.ffn_up.weightQ4_1[8192 22528]
-
output_norm.weightF32[8192]
Metadata
Tensors
blk.0
blk.1
blk.2
blk.3
blk.4
blk.5
blk.6
blk.7
blk.8
blk.9
blk.10
blk.11
blk.12
blk.13
blk.14
blk.15
blk.16
blk.17
blk.18
blk.19
blk.20
blk.21
blk.22
blk.23
blk.24
blk.25
blk.26
blk.27
blk.28
blk.29
blk.30
blk.31
blk.32
blk.33
blk.34
blk.35
blk.36
blk.37
blk.38
blk.39